File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -798,6 +798,7 @@ dsr1-fp8-gb200-dynamo-sglang:
798798 additional-settings :
799799 - " PREFILL_NODES=4"
800800 - " N_ADDITIONAL_FRONTENDS=9"
801+ - " SCRIPT_MODE=max-tpt"
801802 decode :
802803 num-worker : 1
803804 tp : 1
Original file line number Diff line number Diff line change 1+
#!/bin/bash
#
# Clone the Dynamo repository and submit a disaggregated (prefill/decode)
# SGLang benchmark via submit_disagg.sh, which is run from
# $SGL_SLURM_JOBS_PATH.
#
# Required environment: every name passed to check_env_vars below.
# Optional environment:
#   CONFIG_DIR   re-exported as-is (exported empty when unset).
#   SCRIPT_MODE  forwarded as the last submit_disagg.sh argument when set;
#                omitted from the argument list when unset or empty.

set -x

# benchmark_lib.sh is expected to provide check_env_vars; without it the
# validation below cannot run, so stop immediately if it cannot be loaded.
source "$(dirname "$0")/benchmark_lib.sh" || exit 1

check_env_vars CONC_LIST ISL OSL IMAGE SPEC_DECODING MODEL_PATH \
    PREFILL_NUM_WORKERS PREFILL_TP PREFILL_EP PREFILL_DP_ATTN \
    DECODE_NUM_WORKERS DECODE_TP DECODE_EP DECODE_DP_ATTN \
    PREFILL_NODES DECODE_NODES N_ADDITIONAL_FRONTENDS SGL_SLURM_JOBS_PATH # SGL_SLURM_JOBS_PATH FIXME

# Clone and set up Dynamo. `git clone` refuses to write into an existing
# non-empty directory, so an existing checkout is reused; a failed fresh
# clone is fatal instead of being silently ignored.
if [ -d dynamo/.git ]; then
    echo "Dynamo repository already present, reusing existing checkout."
else
    echo "Cloning Dynamo repository..."
    git clone --branch ishan/sa-1.1-sgl-dsr1 https://github.com/ai-dynamo/dynamo.git || exit 1
fi

# submit_disagg.sh is invoked by relative path, so a failed cd must abort
# rather than run whatever happens to be in the current directory.
cd "$SGL_SLURM_JOBS_PATH" || exit 1

# Set up SGL launch script-specific environment variables
export TIME_LIMIT="04:00:00"
export MODEL_PATH
export CONFIG_DIR="${CONFIG_DIR:-}"
export CONTAINER_IMAGE="$IMAGE"
export GPU_TYPE="gb200-fp4"

# Launch jobs based on ISL/OSL
# Replace ' ' in CONC_LIST with 'x' such that the concurrency list is represented
# by a list of numbers delimited by 'x'. This is because of how the underlying launch script
# expects the concurrencies.
# NOTE(review): the meaning of the literal `inf` argument is defined by
# submit_disagg.sh and is not visible here -- confirm against that script.
bash ./submit_disagg.sh "$PREFILL_NODES" \
    "$PREFILL_NUM_WORKERS" \
    "$DECODE_NODES" \
    "$DECODE_NUM_WORKERS" \
    "$N_ADDITIONAL_FRONTENDS" \
    "$ISL" "$OSL" "${CONC_LIST// /x}" inf \
    "$GPU_TYPE" \
    ${SCRIPT_MODE:+"$SCRIPT_MODE"}
Original file line number Diff line number Diff line change @@ -21,6 +21,7 @@ export TIME_LIMIT="04:00:00"
2121export MODEL_PATH=$MODEL_PATH
2222export CONFIG_DIR=$CONFIG_DIR
2323export CONTAINER_IMAGE=$IMAGE
24+ export GPU_TYPE=" gb200-fp8"
2425
2526# Launch jobs based on ISL/OSL
2627# Replace ' ' in CONC_LIST with 'x' such that the concurrency list is represented
@@ -32,4 +33,5 @@ bash ./submit_disagg.sh $PREFILL_NODES \
3233 $DECODE_NUM_WORKERS \
3334 $N_ADDITIONAL_FRONTENDS \
3435 $ISL $OSL " ${CONC_LIST// / x} " inf \
36+ $GPU_TYPE \
3537 $SCRIPT_MODE
You can’t perform that action at this time.
0 commit comments