Skip to content

Commit

Permalink
feat: add perf-counter to record dropped timeout rpc count (XiaoMi#859)
Browse files Browse the repository at this point in the history
  • Loading branch information
hycdong committed Sep 1, 2021
1 parent cb93d91 commit b87c7e2
Show file tree
Hide file tree
Showing 5 changed files with 31 additions and 1 deletion.
1 change: 1 addition & 0 deletions include/dsn/tool-api/task.h
Original file line number Diff line number Diff line change
Expand Up @@ -439,6 +439,7 @@ class rpc_request_task : public task
spec().name.c_str(),
_request->header->from_address.to_string(),
_request->header->client.timeout_ms);
spec().on_rpc_task_dropped.execute(this);
}
}

Expand Down
1 change: 1 addition & 0 deletions include/dsn/tool-api/task_spec.h
Original file line number Diff line number Diff line change
Expand Up @@ -221,6 +221,7 @@ class task_spec : public extensible_object<task_spec, 4>
join_point<bool, task *, message_ex *, rpc_response_task *>
on_rpc_call; // return true means continue, otherwise dropped and (optionally) timedout
join_point<bool, rpc_request_task *> on_rpc_request_enqueue;
join_point<void, rpc_request_task *> on_rpc_task_dropped; // rpc task dropped

// RPC_RESPONSE
join_point<bool, task *, message_ex *> on_rpc_reply;
Expand Down
28 changes: 27 additions & 1 deletion src/runtime/profiler.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,12 @@ counter_info *counter_info_ptr[] = {
"TIMEOUT(#/s)",
"#/s"),
new counter_info(
{"task.inqueue", "tiq"}, TASK_IN_QUEUE, COUNTER_TYPE_NUMBER, "InQueue(#)", "#")};
{"task.inqueue", "tiq"}, TASK_IN_QUEUE, COUNTER_TYPE_NUMBER, "InQueue(#)", "#"),
new counter_info({"rpc.dropped", "rdit"},
RPC_DROPPED_IF_TIMEOUT,
COUNTER_TYPE_NUMBER,
"RPC.DROPPED(#)",
"#")};

// call normal task
static void profiler_on_task_create(task *caller, task *callee)
Expand Down Expand Up @@ -269,6 +274,15 @@ static void profiler_on_rpc_request_enqueue(rpc_request_task *callee)
}
}

static void profile_on_rpc_task_dropped(rpc_request_task *callee)
{
auto code = callee->spec().code;
auto ptr = s_spec_profilers[code].ptr[RPC_DROPPED_IF_TIMEOUT].get();
if (ptr != nullptr) {
ptr->increment();
}
}

static void profiler_on_rpc_create_response(message_ex *req, message_ex *resp)
{
message_ext_for_profiler::get(resp) = message_ext_for_profiler::get(req);
Expand Down Expand Up @@ -543,6 +557,17 @@ void profiler::install(service_spec &)
COUNTER_TYPE_NUMBER_PERCENTILES,
"");
}
if (dsn_config_get_value_bool(
section_name.c_str(),
"rpc_request_dropped_before_execution_when_timeout",
false,
"whether to profile the number of rpc dropped for timeout"))
s_spec_profilers[i].ptr[RPC_DROPPED_IF_TIMEOUT].init_global_counter(
"zion",
"profiler",
(name + std::string(".rpc.dropped")).c_str(),
COUNTER_TYPE_NUMBER,
"rpc dropped if queue time exceed client timeout");
} else if (spec->type == dsn_task_type_t::TASK_TYPE_RPC_RESPONSE) {
if (dsn_config_get_value_bool(section_name.c_str(),
"profiler::latency.client",
Expand Down Expand Up @@ -601,6 +626,7 @@ void profiler::install(service_spec &)
spec->on_aio_enqueue.put_back(profiler_on_aio_enqueue, "profiler");
spec->on_rpc_call.put_back(profiler_on_rpc_call, "profiler");
spec->on_rpc_request_enqueue.put_back(profiler_on_rpc_request_enqueue, "profiler");
spec->on_rpc_task_dropped.put_back(profile_on_rpc_task_dropped, "profiler");
spec->on_rpc_create_response.put_back(profiler_on_rpc_create_response, "profiler");
spec->on_rpc_reply.put_back(profiler_on_rpc_reply, "profiler");
spec->on_rpc_response_enqueue.put_back(profiler_on_rpc_response_enqueue, "profiler");
Expand Down
1 change: 1 addition & 0 deletions src/runtime/profiler_header.h
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,7 @@ enum perf_counter_ptr_type
RPC_CLIENT_NON_TIMEOUT_LATENCY_NS,
RPC_CLIENT_TIMEOUT_THROUGHPUT,
TASK_IN_QUEUE,
RPC_DROPPED_IF_TIMEOUT,

PERF_COUNTER_COUNT,
PERF_COUNTER_INVALID
Expand Down
1 change: 1 addition & 0 deletions src/runtime/task/task_spec.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -162,6 +162,7 @@ task_spec::task_spec(int code,

on_rpc_call((std::string(name) + std::string(".rpc.call")).c_str()),
on_rpc_request_enqueue((std::string(name) + std::string(".rpc.request.enqueue")).c_str()),
on_rpc_task_dropped((std::string(name) + std::string(".dropped")).c_str()),
on_rpc_reply((std::string(name) + std::string(".rpc.reply")).c_str()),
on_rpc_response_enqueue((std::string(name) + std::string(".rpc.response.enqueue")).c_str()),
on_rpc_create_response((std::string(name) + std::string("rpc.create.response")).c_str())
Expand Down

0 comments on commit b87c7e2

Please sign in to comment.