Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add GRPC thread CPU time metric #11772

Merged
merged 1 commit into from
Nov 25, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 4 additions & 4 deletions ydb/core/driver_lib/run/run.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -973,13 +973,13 @@ void TKikimrRunner::InitializeGRpc(const TKikimrRunConfig& runConfig) {
sslData.DoRequestClientCertificate = appConfig.GetClientCertificateAuthorization().GetRequestClientCertificate();
sslOpts.SetSslData(sslData);

GRpcServers.push_back({ "grpcs", new NYdbGrpc::TGRpcServer(sslOpts) });
GRpcServers.push_back({ "grpcs", new NYdbGrpc::TGRpcServer(sslOpts, Counters) });

fillFn(grpcConfig, *GRpcServers.back().second, sslOpts);
}

if (grpcConfig.GetPort()) {
GRpcServers.push_back({ "grpc", new NYdbGrpc::TGRpcServer(opts) });
GRpcServers.push_back({ "grpc", new NYdbGrpc::TGRpcServer(opts, Counters) });

fillFn(grpcConfig, *GRpcServers.back().second, opts);
}
Expand All @@ -996,7 +996,7 @@ void TKikimrRunner::InitializeGRpc(const TKikimrRunConfig& runConfig) {
xopts.SetEndpointId(ex.GetEndpointId());
}

GRpcServers.push_back({ "grpc", new NYdbGrpc::TGRpcServer(xopts) });
GRpcServers.push_back({ "grpc", new NYdbGrpc::TGRpcServer(xopts, Counters) });
fillFn(ex, *GRpcServers.back().second, xopts);
}

Expand Down Expand Up @@ -1035,7 +1035,7 @@ void TKikimrRunner::InitializeGRpc(const TKikimrRunConfig& runConfig) {
Y_ABORT_UNLESS(xopts.SslData->Cert, "Cert not set");
Y_ABORT_UNLESS(xopts.SslData->Key, "Key not set");

GRpcServers.push_back({ "grpcs", new NYdbGrpc::TGRpcServer(xopts) });
GRpcServers.push_back({ "grpcs", new NYdbGrpc::TGRpcServer(xopts, Counters) });
fillFn(ex, *GRpcServers.back().second, xopts);
}
}
Expand Down
3 changes: 2 additions & 1 deletion ydb/core/grpc_streaming/grpc_streaming_ut.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -95,12 +95,13 @@ class TGRpcTestServer {

Server->GetRuntime()->SetLogPriority(NKikimrServices::GRPC_SERVER, NActors::NLog::PRI_DEBUG);

TIntrusivePtr<::NMonitoring::TDynamicCounters> counters(MakeIntrusive<::NMonitoring::TDynamicCounters>());

NYdbGrpc::TServerOptions options;
options.SetPort(grpc);
GRpcServer.Reset(new NYdbGrpc::TGRpcServer(options));

auto* as = Server->GetRuntime()->GetAnyNodeActorSystem();
TIntrusivePtr<::NMonitoring::TDynamicCounters> counters(MakeIntrusive<::NMonitoring::TDynamicCounters>());

GRpcServer->AddService(new TStreamingService<TImplActor>(as, counters));
GRpcServer->Start();
Expand Down
6 changes: 3 additions & 3 deletions ydb/core/testlib/test_client.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -346,6 +346,9 @@ namespace Tests {
}

void TServer::EnableGRpc(const NYdbGrpc::TServerOptions& options, ui32 grpcServiceNodeId) {
GRpcServerRootCounters = MakeIntrusive<::NMonitoring::TDynamicCounters>();
auto& counters = GRpcServerRootCounters;

GRpcServer.reset(new NYdbGrpc::TGRpcServer(options));
auto grpcService = new NGRpcProxy::TGRpcService();

Expand Down Expand Up @@ -378,9 +381,6 @@ namespace Tests {
auto grpcMon = system->Register(NGRpcService::CreateGrpcMonService(), TMailboxType::ReadAsFilled, appData.UserPoolId);
system->RegisterLocalService(NGRpcService::GrpcMonServiceId(), grpcMon);

GRpcServerRootCounters = MakeIntrusive<::NMonitoring::TDynamicCounters>();
auto& counters = GRpcServerRootCounters;

// Setup discovery for typically used services on the node
{
TIntrusivePtr<NGRpcService::TGrpcEndpointDescription> desc = new NGRpcService::TGrpcEndpointDescription();
Expand Down
39 changes: 31 additions & 8 deletions ydb/library/grpc/server/grpc_server.cpp
Original file line number Diff line number Diff line change
@@ -1,5 +1,8 @@
#include "grpc_server.h"

#include <library/cpp/monlib/dynamic_counters/counters.h>
#include <library/cpp/time_provider/monotonic.h>

#include <util/string/join.h>
#include <util/generic/yexception.h>
#include <util/system/thread.h>
Expand All @@ -18,19 +21,31 @@

namespace NYdbGrpc {

using NThreading::TFuture;

static void PullEvents(grpc::ServerCompletionQueue* cq) {
static void PullEvents(grpc::ServerCompletionQueue* cq, TIntrusivePtr<::NMonitoring::TDynamicCounters> counters) {
TThread::SetCurrentThreadName("grpc_server");
auto okCounter = counters->GetCounter("RequestExecuted", true);
auto errorCounter = counters->GetCounter("RequestDestroyed", true);
auto cpuTime = counters->GetCounter("ThreadCPU", true);

NMonotonic::TMonotonic lastCpuTimeTs = {};
while (true) {
void* tag; // uniquely identifies a request.
bool ok;

auto now = NMonotonic::TMonotonic::Now();
if (now - lastCpuTimeTs >= TDuration::Seconds(1)) {
lastCpuTimeTs = now;
*cpuTime = ThreadCPUTime();
}

if (cq->Next(&tag, &ok)) {
IQueueEvent* const ev(static_cast<IQueueEvent*>(tag));

if (!ev->Execute(ok)) {
if (ev->Execute(ok)) {
okCounter->Inc();
} else {
ev->DestroyRequest();
errorCounter->Inc();
}
} else {
break;
Expand Down Expand Up @@ -103,10 +118,16 @@ void TGrpcServiceProtectiable::DecRequest() {
}
}

TGRpcServer::TGRpcServer(const TServerOptions& opts)
TGRpcServer::TGRpcServer(const TServerOptions& opts, TIntrusivePtr<::NMonitoring::TDynamicCounters> counters)
: Options_(opts)
, Counters_(std::move(counters))
, Limiter_(Options_.MaxGlobalRequestInFlight)
{}
{
if (!Counters_) {
// make a stub to simplify code
Counters_.Reset(new ::NMonitoring::TDynamicCounters());
}
}

TGRpcServer::~TGRpcServer() {
Y_ABORT_UNLESS(Ts.empty());
Expand Down Expand Up @@ -237,10 +258,12 @@ void TGRpcServer::Start() {
}

Ts.reserve(Options_.WorkerThreads);
auto grpcCounters = Counters_->GetSubgroup("counters", "grpc");
for (size_t i = 0; i < Options_.WorkerThreads; ++i) {
auto* cq = &CQS_[i % CQS_.size()];
Ts.push_back(SystemThreadFactory()->Run([cq] {
PullEvents(cq->get());
auto workerCounters = grpcCounters->GetSubgroup("worker", ToString(i));
Ts.push_back(SystemThreadFactory()->Run([cq, workerCounters] {
PullEvents(cq->get(), std::move(workerCounters));
}));
}

Expand Down
10 changes: 9 additions & 1 deletion ydb/library/grpc/server/grpc_server.h
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,10 @@

#include <grpcpp/grpcpp.h>

namespace NMonitoring {
struct TDynamicCounters;
} // NMonitoring

namespace NYdbGrpc {

struct TSslData {
Expand Down Expand Up @@ -349,8 +353,11 @@ class TGrpcServiceBase: public TGrpcServiceProtectiable {
class TGRpcServer {
public:
using IGRpcServicePtr = TIntrusivePtr<IGRpcService>;
TGRpcServer(const TServerOptions& opts);

// TODO: remove default nullptr after migration
TGRpcServer(const TServerOptions& opts, TIntrusivePtr<::NMonitoring::TDynamicCounters> counters = nullptr);
~TGRpcServer();

void AddService(IGRpcServicePtr service);
void Start();
// Send stop to registered services and call Shutdown on grpc server
Expand All @@ -365,6 +372,7 @@ class TGRpcServer {
using IThreadRef = TAutoPtr<IThreadFactory::IThread>;

const TServerOptions Options_;
TIntrusivePtr<::NMonitoring::TDynamicCounters> Counters_;
std::unique_ptr<grpc::Server> Server_;
std::vector<std::unique_ptr<grpc::ServerCompletionQueue>> CQS_;
TVector<IThreadRef> Ts;
Expand Down
Loading