Skip to content

Commit dc9f6df

Browse files
committed
issue/340 - fix(llm): guard PD config and restore static scheduler step
1 parent dc37614 commit dc9f6df

3 files changed

Lines changed: 16 additions & 1 deletion

File tree

python/infinilm/config/engine_config.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,3 +43,11 @@ class EngineConfig:
4343
attn_backend: str = "default"
4444
skip_load: bool = False
4545
kv_transfer_config: Optional[KVTransferConfig] = None
46+
47+
def __post_init__(self) -> None:
    """Validate the KV-transfer settings once the config fields are set.

    A KV connector may only be configured together with the paged cache.
    The check is skipped when ``kv_transfer_config`` is ``None`` or when its
    ``kv_connector`` is falsy (no connector selected).

    Raises:
        ValueError: If a KV connector is configured while ``cache_type``
            is anything other than ``"paged"``.
    """
    if (
        self.kv_transfer_config is not None
        and self.kv_transfer_config.kv_connector
        and self.cache_type != "paged"
    ):
        raise ValueError("kv_transfer_config requires cache_type='paged'")

python/infinilm/llm/model_runner/model_runner.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -86,7 +86,10 @@ def __init__(self, config: EngineConfig):
8686

8787
# Initialize KV connector
8888
self.kv_connector = None
89-
if self.kv_transfer_config is not None:
89+
if (
90+
self.kv_transfer_config is not None
91+
and self.kv_transfer_config.kv_connector
92+
):
9093
connector_name = self.kv_transfer_config.kv_connector
9194
self.kv_connector = KVConnectorFactory.create_connector(
9295
connector_name=connector_name,

python/infinilm/llm/static_scheduler.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -223,6 +223,10 @@ def update_cache(self):
223223
f"update_cache: cached_block_hashes now has {len(self.cached_block_hashes)} blocks"
224224
)
225225

226+
def update_from_output(self, model_output) -> None:
    """Static cache has no scheduler-side connector state to update.

    This method is intentionally a no-op: ``model_output`` is accepted but
    never read.
    NOTE(review): presumably kept so callers can invoke the same post-step
    hook on every scheduler type -- confirm against the caller.

    Args:
        model_output: Output of the model step; ignored here.

    Returns:
        Always ``None``.
    """
    return None
229+
226230
def complete_requests(self, requests: List[InferenceRequest]):
227231
"""Handle completed requests."""
228232
for req in requests:

0 commit comments

Comments
 (0)