@@ -131,11 +131,11 @@ def __init__(
131131 f"{ self .cache_config .bytes_per_token_per_layer / self .config .parallel_config .tensor_parallel_size } "
132132 )
133133
134- main_process_metrics .max_gpu_block_num . set ( self .num_gpu_blocks )
135- main_process_metrics .max_cpu_block_num . set ( self .num_cpu_blocks )
136- main_process_metrics .available_gpu_block_num . set ( self .num_gpu_blocks )
137- main_process_metrics .free_gpu_block_num . set ( self .num_gpu_blocks )
138- main_process_metrics .available_gpu_resource . set ( 1.0 )
134+ main_process_metrics .set_value ( "max_gpu_block_num" , self .num_gpu_blocks )
135+ main_process_metrics .set_value ( "max_cpu_block_num" , self .num_cpu_blocks )
136+ main_process_metrics .set_value ( "available_gpu_block_num" , self .num_gpu_blocks )
137+ main_process_metrics .set_value ( "free_gpu_block_num" , self .num_gpu_blocks )
138+ main_process_metrics .set_value ( "available_gpu_resource" , 1.0 )
139139
140140 def _get_kv_cache_shape (self , max_block_num ):
141141 from fastdeploy .model_executor .layers .attention import get_attention_backend
@@ -462,11 +462,11 @@ def update_cache_config(self, cache_config):
462462 heapq .heapify (self .gpu_free_block_list )
463463 self .node_id_pool = list (range (self .num_gpu_blocks + self .num_cpu_blocks ))
464464
465- main_process_metrics .max_gpu_block_num . set ( self .num_gpu_blocks )
466- main_process_metrics .max_cpu_block_num . set ( self .num_cpu_blocks )
467- main_process_metrics .available_gpu_block_num . set ( self .num_gpu_blocks )
468- main_process_metrics .free_gpu_block_num . set ( self .num_gpu_blocks )
469- main_process_metrics .available_gpu_resource . set ( 1.0 )
465+ main_process_metrics .set_value ( "max_gpu_block_num" , self .num_gpu_blocks )
466+ main_process_metrics .set_value ( "max_cpu_block_num" , self .num_cpu_blocks )
467+ main_process_metrics .set_value ( "available_gpu_block_num" , self .num_gpu_blocks )
468+ main_process_metrics .set_value ( "free_gpu_block_num" , self .num_gpu_blocks )
469+ main_process_metrics .set_value ( "available_gpu_resource" , 1.0 )
470470
471471 def can_allocate_gpu_blocks (self , num_blocks : int , try_free_gpu_blocks : bool = True ):
472472 """
@@ -494,8 +494,8 @@ def allocate_gpu_blocks(self, num_blocks, req_id=None):
494494 logger .info (
495495 f"req_id:{ req_id } allocate_gpu_blocks: { allocated_block_ids } , len(self.gpu_free_block_list) { len (self .gpu_free_block_list )} "
496496 )
497- main_process_metrics .free_gpu_block_num . set ( len (self .gpu_free_block_list ))
498- main_process_metrics .available_gpu_resource . set ( self .available_gpu_resource )
497+ main_process_metrics .set_value ( "free_gpu_block_num" , len (self .gpu_free_block_list ))
498+ main_process_metrics .set_value ( "available_gpu_resource" , self .available_gpu_resource )
499499 return allocated_block_ids
500500
501501 def recycle_gpu_blocks (self , gpu_block_ids , req_id = None ):
@@ -529,8 +529,8 @@ def recycle_gpu_blocks(self, gpu_block_ids, req_id=None):
529529 else :
530530 heapq .heappush (self .gpu_free_block_list , gpu_block_ids )
531531 logger .debug (f"req_id:{ req_id } recycle blocks end" )
532- main_process_metrics .free_gpu_block_num . set ( len (self .gpu_free_block_list ))
533- main_process_metrics .available_gpu_resource . set ( self .available_gpu_resource )
532+ main_process_metrics .set_value ( "free_gpu_block_num" , len (self .gpu_free_block_list ))
533+ main_process_metrics .set_value ( "available_gpu_resource" , self .available_gpu_resource )
534534
535535 def allocate_cpu_blocks (self , num_blocks ):
536536 """
@@ -2296,9 +2296,9 @@ def reset(self, wait_for_tasks_done=False):
22962296
22972297 # reset metrics
22982298 self .metrics .reset_metrics ()
2299- main_process_metrics .free_gpu_block_num . set ( len (self .gpu_free_block_list ))
2300- main_process_metrics .available_gpu_block_num . set ( len (self .gpu_free_block_list ))
2301- main_process_metrics .available_gpu_resource . set ( self .available_gpu_resource )
2299+ main_process_metrics .set_value ( "free_gpu_block_num" , len (self .gpu_free_block_list ))
2300+ main_process_metrics .set_value ( "available_gpu_block_num" , len (self .gpu_free_block_list ))
2301+ main_process_metrics .set_value ( "available_gpu_resource" , self .available_gpu_resource )
23022302
23032303 def clear_prefix_cache (self ):
23042304 """
0 commit comments