File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -24,6 +24,8 @@ enable_event_sync: true
2424# Enable UCM metrics so they can be monitored online via Grafana and Prometheus.
2525# metrics_config_path: "/workspace/unified-cache-management/examples/metrics/metrics_configs.yaml"
2626
27+ chunk_size : 256
28+
2729# Sparse attention configuration
2830# ucm_sparse_config:
2931 # GSAOnDevice: {}
Original file line number Diff line number Diff line change @@ -96,6 +96,7 @@ def test_online_accuracy_hbm_ssd_mixed(
9696 if ucm_connector_name == "UcmNfsStore"
9797 else {}
9898 ),
99+ "chunk_size" : 256 ,
99100 }
100101
101102 # Build vllm_server_startup_args
@@ -183,6 +184,7 @@ def test_online_accuracy_hbm_ssd_mixed_pp(
183184 if ucm_connector_name == "UcmNfsStore"
184185 else {}
185186 ),
187+ "chunk_size" : 256 ,
186188 }
187189
188190 # Build vllm_server_startup_args with pipeline parallel size
@@ -256,6 +258,7 @@ def test_online_accuracy_hbm_ssd_mixed_tp(
256258 if ucm_connector_name == "UcmNfsStore"
257259 else {}
258260 ),
261+ "chunk_size" : 256 ,
259262 }
260263
261264 # Build vllm_server_startup_args with tensor parallel size
You can’t perform that action at this time.
0 commit comments