@@ -237,7 +237,6 @@ def __init__(self, vllm_config: "VllmConfig", role: KVConnectorRole):
237237 ucm_config = Config (vllm_config .kv_transfer_config )
238238 self .engine_id = vllm_config .kv_transfer_config .engine_id
239239 self .launch_config = ucm_config .get_config ()
240- logger .info (f"self.launch_config: { self .launch_config } " )
241240 self .connector_configs = self .launch_config .get ("ucm_connectors" , [])
242241 self .enable_event_sync = self .launch_config .get ("enable_event_sync" , True )
243242 assert len (self .connector_configs ) > 0 , "no storage connector name in config."
@@ -853,11 +852,7 @@ def wait_for_save(self) -> None:
853852class UCMCPConnector (UCMLayerWiseConnector ):
854853 def __init__ (self , vllm_config : "VllmConfig" , role : KVConnectorRole ):
855854 super ().__init__ (vllm_config , role )
856- self .use_layerwise = (
857- self ._vllm_config .kv_transfer_config .kv_connector_extra_config .get (
858- "use_layerwise" , False
859- )
860- )
855+ self .use_layerwise = self .launch_config .get ("use_layerwise" , False )
861856
862857 try :
863858 from vllm .distributed import get_dcp_group , get_pcp_group
@@ -1120,22 +1115,21 @@ class UCMConnector(KVConnectorBase_V1):
11201115 def __init__ (self , vllm_config : "VllmConfig" , role : KVConnectorRole ):
11211116 super ().__init__ (vllm_config = vllm_config , role = role )
11221117 self .connector : KVConnectorBase_V1
1123- # TODO new conn by config
1118+ ucm_config = Config (vllm_config .kv_transfer_config )
1119+ self .launch_config = ucm_config .get_config ()
1120+ logger .info (f"self.launch_config: { self .launch_config } " )
1121+
11241122 use_layerwise = (
1125- self ._vllm_config . kv_transfer_config . kv_connector_extra_config . get (
1126- "use_layerwise" , False
1127- )
1123+ self .launch_config . get ("use_layerwise" , False )
1124+ if self . launch_config is not None
1125+ else False
11281126 )
11291127 pp_enabled = self ._vllm_config .parallel_config .pipeline_parallel_size > 1
11301128 if pp_enabled and not use_layerwise :
11311129 raise RuntimeError (
11321130 "Pipeline parallelism is not supported in UCMDirectConnector, please set use_layerwise=True."
11331131 )
1134- if (
1135- self ._vllm_config .kv_transfer_config is not None
1136- and "hit_ratio"
1137- in self ._vllm_config .kv_transfer_config .kv_connector_extra_config
1138- ):
1132+ if self .launch_config is not None and "hit_ratio" in self .launch_config :
11391133 self .connector = UCMMockConnector (vllm_config , role )
11401134 elif (
11411135 hasattr (self ._vllm_config .parallel_config , "prefill_context_parallel_size" )
@@ -1147,12 +1141,7 @@ def __init__(self, vllm_config: "VllmConfig", role: KVConnectorRole):
11471141 > 1
11481142 ):
11491143 self .connector = UCMCPConnector (vllm_config , role )
1150- elif (
1151- self ._vllm_config .kv_transfer_config is not None
1152- and self ._vllm_config .kv_transfer_config .kv_connector_extra_config .get (
1153- "use_layerwise" , False
1154- )
1155- ):
1144+ elif use_layerwise :
11561145 self .connector = UCMLayerWiseConnector (vllm_config , role )
11571146 else :
11581147 self .connector = UCMDirectConnector (vllm_config , role )
0 commit comments