Skip to content

Commit 2276319

Browse files
committed
[Metrics] move prompt_tokens_total report to main process
1 parent 529ec9e commit 2276319

2 files changed

Lines changed: 4 additions & 4 deletions

File tree

fastdeploy/engine/common_engine.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1339,6 +1339,9 @@ def _insert_zmq_task_to_scheduler(self):
1339 1339

1340 1340
request.metrics.scheduler_recv_req_time = time.time()
1341 1341
main_process_metrics.inc_value("requests_number")
1342+
main_process_metrics.inc_value("prompt_tokens_total", request.prompt_token_ids_len)
1343+
main_process_metrics.obs_value("request_prompt_tokens", request.prompt_token_ids_len)
1344+
main_process_metrics.obs_value("request_params_max_tokens", request.sampling_params.max_tokens)
1342 1345
trace_carrier = data.get("trace_carrier")
1343 1346
if trace_carrier:
1344 1347
request_id = get_base_request_id(data["request_id"])

fastdeploy/entrypoints/engine_client.py

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -53,7 +53,6 @@
53 53
log_request,
54 54
log_request_error,
55 55
)
56-
from fastdeploy.metrics.metrics import main_process_metrics
57 56
from fastdeploy.platforms import current_platform
58 57
from fastdeploy.trace.constants import LoggingEventName
59 58
from fastdeploy.trace.trace_logger import print as trace_print
@@ -374,9 +373,7 @@ async def add_requests(self, task):
374 373

375 374
if "messages" in task:
376 375
task["messages"] = None
377-
main_process_metrics.obs_value("request_params_max_tokens", task["max_tokens"])
378-
main_process_metrics.inc_value("prompt_tokens_total", input_ids_len)
379-
main_process_metrics.obs_value("request_prompt_tokens", input_ids_len)
376+
380 377
except Exception as e:
381 378
log_request_error(
382 379
message="request[{request_id}] add_requests error: {error}, {traceback}",

0 commit comments

Comments
 (0)