We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c95a3e4 · commit 5eb8ea1 (Copy full SHA for 5eb8ea1)
2 files changed
benchmarks/dsr1_fp4_gb200_dynamo-trt_slurm.sh
@@ -39,10 +39,11 @@ fi
39
40
kind=dynamo_disagg
41
additional_slurm_args="--time=04:00:00"
42
+ntasks_per_node=4
43
44
gen_nodes=$(((DECODE_TP + 3)/4 * DECODE_NUM_WORKERS))
45
total_nodes=$((PREFILL_NUM_WORKERS + gen_nodes))
-total_tasks=$((total_nodes * NTASKS_PER_NODE))
46
+total_tasks=$((total_nodes * ntasks_per_node))
47
48
decode_eplb_num_slots=0
49
runners/launch_gb200-nv.sh
@@ -8,8 +8,6 @@ set -x
8
export SLURM_PARTITION="batch"
9
export SLURM_ACCOUNT="benchmark"
10
export SLURM_JOB_NAME="benchmark-dynamo.job"
11
-# For GB200 we have 4 GPUs per node
12
-export NTASKS_PER_NODE=4
13
14
# For SGLang - we are working on updating the 8k1k configs
15
# For now we add conditionals to this script to use newer code for the 1k1k configs
0 commit comments