Skip to content

Commit 2cc19a3

Browse files
committed
more
1 parent 297bd7f commit 2cc19a3

3 files changed

Lines changed: 40 additions & 0 deletions

File tree

.github/configs/nvidia-master.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -798,6 +798,7 @@ dsr1-fp8-gb200-dynamo-sglang:
798798
additional-settings:
799799
- "PREFILL_NODES=4"
800800
- "N_ADDITIONAL_FRONTENDS=9"
801+
- "SCRIPT_MODE=max-tpt"
801802
decode:
802803
num-worker: 1
803804
tp: 1
Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
1+
2+
#!/bin/bash
3+
4+
set -x
5+
6+
source "$(dirname "$0")/benchmark_lib.sh"
7+
8+
check_env_vars CONC_LIST ISL OSL IMAGE SPEC_DECODING MODEL_PATH \
9+
PREFILL_NUM_WORKERS PREFILL_TP PREFILL_EP PREFILL_DP_ATTN \
10+
DECODE_NUM_WORKERS DECODE_TP DECODE_EP DECODE_DP_ATTN \
11+
PREFILL_NODES DECODE_NODES N_ADDITIONAL_FRONTENDS SGL_SLURM_JOBS_PATH # SGL_SLURM_JOBS_PATH FIXME
12+
13+
# Always clone and setup Dynamo
14+
echo "Cloning Dynamo repository..."
15+
git clone --branch ishan/sa-1.1-sgl-dsr1 https://github.com/ai-dynamo/dynamo.git
16+
17+
cd "$SGL_SLURM_JOBS_PATH"
18+
19+
# Set up SGL launch script-specific environment variables
20+
export TIME_LIMIT="04:00:00"
21+
export MODEL_PATH=$MODEL_PATH
22+
export CONFIG_DIR=$CONFIG_DIR
23+
export CONTAINER_IMAGE=$IMAGE
24+
export GPU_TYPE="gb200-fp4"
25+
26+
# Launch jobs based on ISL/OSL
27+
# Replace ' ' in CONC_LIST with 'x' such that the concurrency list is represented
28+
# by a list of numbers delimited by 'x'. This is because of how the underlying launch script
29+
# expects the concurrencies.
30+
bash ./submit_disagg.sh $PREFILL_NODES \
31+
$PREFILL_NUM_WORKERS \
32+
$DECODE_NODES \
33+
$DECODE_NUM_WORKERS \
34+
$N_ADDITIONAL_FRONTENDS \
35+
$ISL $OSL "${CONC_LIST// /x}" inf \
36+
$GPU_TYPE \
37+
$SCRIPT_MODE

benchmarks/dsr1_fp8_gb200_dynamo-sglang_slurm.sh

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ export TIME_LIMIT="04:00:00"
2121
export MODEL_PATH=$MODEL_PATH
2222
export CONFIG_DIR=$CONFIG_DIR
2323
export CONTAINER_IMAGE=$IMAGE
24+
export GPU_TYPE="gb200-fp8"
2425

2526
# Launch jobs based on ISL/OSL
2627
# Replace ' ' in CONC_LIST with 'x' such that the concurrency list is represented
@@ -32,4 +33,5 @@ bash ./submit_disagg.sh $PREFILL_NODES \
3233
$DECODE_NUM_WORKERS \
3334
$N_ADDITIONAL_FRONTENDS \
3435
$ISL $OSL "${CONC_LIST// /x}" inf \
36+
$GPU_TYPE \
3537
$SCRIPT_MODE

0 commit comments

Comments
 (0)