File tree Expand file tree Collapse file tree
benchmarks/multi_node/srt-slurm-recipes/sglang/deepseek-v4/8k1k Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -8759,7 +8759,7 @@ dsv4-fp4-gb300-dynamo-vllm:
87598759 dp-attn : true
87608760
87618761dsv4-fp4-gb300-dynamo-sglang :
8762- image : lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647
8762+ image : lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd
87638763 model : deepseek-ai/DeepSeek-V4-Pro
87648764 model-prefix : dsv4
87658765 runner : gb300-cw
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-10p1d-dep4-dep16-14-c8192"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939dynamo :
@@ -94,7 +94,6 @@ backend:
9494 SGLANG_LOG_FORWARD_ITERS : " 1"
9595 SGLANG_LOG_MS : " 1"
9696 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
97- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9897
9998 decode_environment :
10099 PYTHONUNBUFFERED : " 1"
@@ -119,7 +118,6 @@ backend:
119118 SGLANG_LOG_FORWARD_ITERS : " 1"
120119 SGLANG_LOG_MS : " 1"
121120 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
122- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
123121 # is single-node only and corrupts results in 2-node decode setups.
124122
125123 sglang_config :
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-12p1d-dep4-dep12-15-c21504"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939dynamo :
@@ -94,7 +94,6 @@ backend:
9494 SGLANG_LOG_FORWARD_ITERS : " 1"
9595 SGLANG_LOG_MS : " 1"
9696 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
97- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9897
9998 decode_environment :
10099 PYTHONUNBUFFERED : " 1"
@@ -119,7 +118,6 @@ backend:
119118 SGLANG_LOG_FORWARD_ITERS : " 1"
120119 SGLANG_LOG_MS : " 1"
121120 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
122- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
123121 # is single-node only and corrupts results in 2-node decode setups.
124122
125123 sglang_config :
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-1p1d-dep4-dep16-5-c1024"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939dynamo :
@@ -94,7 +94,6 @@ backend:
9494 SGLANG_LOG_FORWARD_ITERS : " 1"
9595 SGLANG_LOG_MS : " 1"
9696 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
97- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9897
9998 decode_environment :
10099 PYTHONUNBUFFERED : " 1"
@@ -119,7 +118,6 @@ backend:
119118 SGLANG_LOG_FORWARD_ITERS : " 1"
120119 SGLANG_LOG_MS : " 1"
121120 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
122- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
123121 # is single-node only and corrupts results in 2-node decode setups.
124122
125123 sglang_config :
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-1p1d-tp4-tp4-2-c1"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939# See ../1k1k/disagg-gb200-1p1d-dep8-tep8.yaml for the dynamo pin
@@ -93,7 +93,6 @@ backend:
9393 SGLANG_DISAGGREGATION_BOOTSTRAP_TIMEOUT : " 100000"
9494 SGLANG_DISAGGREGATION_WAITING_TIMEOUT : " 100000"
9595 SGLANG_OPT_SWA_RELEASE_LEAF_LOCK_AFTER_WINDOW : " 1"
96- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9796
9897 decode_environment :
9998 PYTHONUNBUFFERED : " 1"
@@ -110,7 +109,6 @@ backend:
110109 SGLANG_DISAGGREGATION_BOOTSTRAP_TIMEOUT : " 100000"
111110 SGLANG_DISAGGREGATION_WAITING_TIMEOUT : " 100000"
112111 SGLANG_OPT_SWA_RELEASE_LEAF_LOCK_AFTER_WINDOW : " 1"
113- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
114112 # is single-node only and corrupts results in 2-node decode setups.
115113
116114 sglang_config :
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-4p1d-dep4-dep16-8-c1024"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939dynamo :
@@ -94,7 +94,6 @@ backend:
9494 SGLANG_LOG_FORWARD_ITERS : " 1"
9595 SGLANG_LOG_MS : " 1"
9696 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
97- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9897
9998 decode_environment :
10099 PYTHONUNBUFFERED : " 1"
@@ -119,7 +118,6 @@ backend:
119118 SGLANG_LOG_FORWARD_ITERS : " 1"
120119 SGLANG_LOG_MS : " 1"
121120 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
122- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
123121 # is single-node only and corrupts results in 2-node decode setups.
124122
125123 sglang_config :
Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ name: "disagg-gb300-8p1d-dep4-dep16-12-c4096"
3333
3434model :
3535 path : " deepseek-v4-pro"
36- container : " lmsysorg/sglang:nightly-dev-cu13-20260519-dbac4647 "
36+ container : " lmsysorg/sglang:nightly-dev-cu13-20260520-425dffbd "
3737 precision : " fp4"
3838
3939dynamo :
@@ -94,7 +94,6 @@ backend:
9494 SGLANG_LOG_FORWARD_ITERS : " 1"
9595 SGLANG_LOG_MS : " 1"
9696 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
97- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
9897
9998 decode_environment :
10099 PYTHONUNBUFFERED : " 1"
@@ -119,7 +118,6 @@ backend:
119118 SGLANG_LOG_FORWARD_ITERS : " 1"
120119 SGLANG_LOG_MS : " 1"
121120 SGLANG_REQUEST_STATE_WAIT_TIMEOUT : " 60"
122- SGLANG_OPT_FP8_WO_A_GEMM : " 0"
123121 # is single-node only and corrupts results in 2-node decode setups.
124122
125123 sglang_config :
You can’t perform that action at this time.
0 commit comments