File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -1339,6 +1339,9 @@ def _insert_zmq_task_to_scheduler(self):
13391339
13401340 request .metrics .scheduler_recv_req_time = time .time ()
13411341 main_process_metrics .inc_value ("requests_number" )
1342+ main_process_metrics .inc_value ("prompt_tokens_total" , request .prompt_token_ids_len )
1343+ main_process_metrics .obs_value ("request_prompt_tokens" , request .prompt_token_ids_len )
1344+ main_process_metrics .obs_value ("request_params_max_tokens" , request .sampling_params .max_tokens )
13421345 trace_carrier = data .get ("trace_carrier" )
13431346 if trace_carrier :
13441347 request_id = get_base_request_id (data ["request_id" ])
Original file line number Diff line number Diff line change 5353 log_request ,
5454 log_request_error ,
5555)
56- from fastdeploy .metrics .metrics import main_process_metrics
5756from fastdeploy .platforms import current_platform
5857from fastdeploy .trace .constants import LoggingEventName
5958from fastdeploy .trace .trace_logger import print as trace_print
@@ -374,9 +373,7 @@ async def add_requests(self, task):
374373
375374 if "messages" in task :
376375 task ["messages" ] = None
377- main_process_metrics .obs_value ("request_params_max_tokens" , task ["max_tokens" ])
378- main_process_metrics .inc_value ("prompt_tokens_total" , input_ids_len )
379- main_process_metrics .obs_value ("request_prompt_tokens" , input_ids_len )
376+
380377 except Exception as e :
381378 log_request_error (
382379 message = "request[{request_id}] add_requests error: {error}, {traceback}" ,
You can’t perform that action at this time.
0 commit comments