Skip to content

Commit 7c0cb09

Browse files
committed
feat(profile): add B300 DeepSeek V4 Flash config
1 parent dd551f3 commit 7c0cb09

2 files changed

Lines changed: 19 additions & 1 deletion

File tree

.github/configs/nvidia-master.yaml

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2038,6 +2038,24 @@ dsv4-fp4-b300-sglang:
20382038
- { tp: 8, ep: 8, dp-attn: true, conc-start: 2048, conc-end: 2048 }
20392039
- { tp: 8, ep: 8, dp-attn: true, conc-start: 4096, conc-end: 4096 }
20402040

2041+
# Targeted single-point Flash config for profile.yml. Keep the existing Pro
2042+
# sweep entry above unchanged; this profile-only key reuses the same B300
2043+
# SGLang launch path at the 1k/1k (isl=1024, osl=1024), conc=64 point.
2044+
dsv4-flash-fp4-b300-sglang:
2045+
image: lmsysorg/sglang:deepseek-v4-b300@sha256:2fec8d7958bb0d53b50d7bf04d6ae6a7de8a35503775826e0550a45dd8c3ee15
2046+
model: deepseek-ai/DeepSeek-V4-Flash
2047+
model-prefix: dsv4
2048+
runner: b300
2049+
precision: fp4
2050+
framework: sglang
2051+
multinode: false
2052+
scenarios:
2053+
fixed-seq-len:
2054+
- isl: 1024
2055+
osl: 1024
2056+
search-space:
2057+
- { tp: 4, ep: 1, conc-start: 64, conc-end: 64 }
2058+
20412059
# DeepSeek-V4-Pro on B300 with EAGLE/MTP speculative decoding. Recipe is
20422060
# selected inside benchmarks/single_node/dsv4_fp4_b300_sglang_mtp.sh by
20432061
# DP_ATTENTION:

runners/launch_b300-nv.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -287,7 +287,7 @@ else
287287
HF_HUB_CACHE_MOUNT="/data/models"
288288
if [[ "$MODEL" == "Qwen/Qwen3.5-397B-A17B-FP8" ]]; then
289289
export MODEL="$HF_HUB_CACHE_MOUNT/${MODEL#*/}"
290-
elif [[ "$MODEL_PREFIX" == "dsv4" ]]; then
290+
elif [[ "$MODEL_PREFIX" == "dsv4" && "$MODEL" == "deepseek-ai/DeepSeek-V4-Pro" ]]; then
291291
export MODEL="$HF_HUB_CACHE_MOUNT/dsv4-pro"
292292
fi
293293
SQUASH_FILE="/data/home/sa-shared/gharunners/squash/$(echo "$IMAGE" | sed 's/[\/:@#]/_/g').sqsh"

0 commit comments

Comments
 (0)