Skip to content

Commit 9ff641e

Browse files
Copilot and cquil11 authored
Audit and correct required environment variables documentation in all benchmark scripts (#252)
* Initial plan

* Update required env vars documentation in all benchmark scripts

Co-authored-by: cquil11 <60715037+cquil11@users.noreply.github.com>

* Fix required env vars - remove NF, PREFILL_SIZE, and correct PORT/PORT_OFFSET

Co-authored-by: cquil11 <60715037+cquil11@users.noreply.github.com>

* Remove internally-calculated vars from required env vars (EXTRA_CONFIG_FILE, MAX_NUM_TOKENS, MOE_BACKEND)

Co-authored-by: cquil11 <60715037+cquil11@users.noreply.github.com>

---------

Co-authored-by: copilot-swe-agent[bot] <198982749+Copilot@users.noreply.github.com>
Co-authored-by: cquil11 <60715037+cquil11@users.noreply.github.com>
1 parent a5ebc4a commit 9ff641e

26 files changed

Lines changed: 118 additions & 135 deletions

benchmarks/dsr1_fp4_b200_docker.sh

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,17 @@
11
#!/usr/bin/env bash
22

3+
# === Required Env Vars ===
4+
# MODEL
5+
# PORT
6+
# TP
7+
# CONC
8+
# ISL
9+
# OSL
10+
# RANDOM_RANGE_RATIO
11+
# RESULT_FILENAME
12+
# EP_SIZE
13+
# NUM_PROMPTS
14+
315
nvidia-smi
416

517
# To improve CI stability, we patch this helper function to prevent a race condition that

benchmarks/dsr1_fp4_b200_trt_slurm.sh

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,13 @@
11
#!/usr/bin/env bash
22

3-
# === Required Env Vars ===
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
6-
# IMAGE
3+
# === Required Env Vars ===
74
# MODEL
5+
# TP
6+
# CONC
87
# ISL
98
# OSL
109
# MAX_MODEL_LEN
1110
# RANDOM_RANGE_RATIO
12-
# TP
13-
# CONC
1411
# RESULT_FILENAME
1512
# PORT_OFFSET
1613
# DP_ATTENTION

benchmarks/dsr1_fp4_mi355x_docker.sh

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,14 +1,15 @@
11
#!/usr/bin/env bash
22

3-
# ========= Required Env Vars =========
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
3+
# === Required Env Vars ===
64
# MODEL
7-
# MAX_MODEL_LEN
8-
# RANDOM_RANGE_RATIO
5+
# PORT
96
# TP
107
# CONC
11-
# PORT
8+
# ISL
9+
# OSL
10+
# RANDOM_RANGE_RATIO
11+
# RESULT_FILENAME
12+
# NUM_PROMPTS
1213
export SGLANG_USE_AITER=1
1314

1415
PREFILL_SIZE=196608

benchmarks/dsr1_fp4_mi355x_slurm.sh

Lines changed: 4 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,13 @@
11
#!/usr/bin/env bash
22

3-
# ========= Required Env Vars =========
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
3+
# === Required Env Vars ===
64
# MODEL
5+
# PORT
6+
# TP
7+
# CONC
78
# ISL
89
# OSL
9-
# MAX_MODEL_LEN
1010
# RANDOM_RANGE_RATIO
11-
# TP
12-
# CONC
13-
# PORT
1411
# RESULT_FILENAME
1512
export SGLANG_USE_AITER=1
1613
SERVER_LOG=$(mktemp /tmp/server-XXXXXX.log)

benchmarks/dsr1_fp8_b200_docker.sh

Lines changed: 7 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,13 +1,16 @@
11
#!/usr/bin/env bash
22

3-
# ========= Required Env Vars =========
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
3+
# === Required Env Vars ===
64
# MODEL
75
# PORT
86
# TP
97
# CONC
10-
# MAX_MODEL_LEN
8+
# ISL
9+
# OSL
10+
# RANDOM_RANGE_RATIO
11+
# RESULT_FILENAME
12+
# EP_SIZE
13+
# NUM_PROMPTS
1114

1215
nvidia-smi
1316

benchmarks/dsr1_fp8_b200_trt_slurm.sh

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,13 @@
11
#!/usr/bin/env bash
22

3-
# === Required Env Vars ===
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
6-
# IMAGE
3+
# === Required Env Vars ===
74
# MODEL
5+
# TP
6+
# CONC
87
# ISL
98
# OSL
109
# MAX_MODEL_LEN
1110
# RANDOM_RANGE_RATIO
12-
# TP
13-
# CONC
1411
# RESULT_FILENAME
1512
# PORT_OFFSET
1613
# DP_ATTENTION

benchmarks/dsr1_fp8_h200_slurm.sh

Lines changed: 3 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,12 @@
11
#!/usr/bin/env bash
22

3-
# === Required Env Vars ===
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
6-
# IMAGE
3+
# === Required Env Vars ===
74
# MODEL
5+
# TP
6+
# CONC
87
# ISL
98
# OSL
10-
# MAX_MODEL_LEN
119
# RANDOM_RANGE_RATIO
12-
# TP
13-
# CONC
1410
# RESULT_FILENAME
1511
# PORT_OFFSET
1612

benchmarks/dsr1_fp8_h200_trt_slurm.sh

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,13 @@
11
#!/usr/bin/env bash
22

3-
# === Required Env Vars ===
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
6-
# IMAGE
3+
# === Required Env Vars ===
74
# MODEL
5+
# TP
6+
# CONC
87
# ISL
98
# OSL
109
# MAX_MODEL_LEN
1110
# RANDOM_RANGE_RATIO
12-
# TP
13-
# CONC
1411
# RESULT_FILENAME
1512
# PORT_OFFSET
1613
# DP_ATTENTION

benchmarks/dsr1_fp8_mi300x_docker.sh

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,13 +1,14 @@
11
#!/usr/bin/env bash
22

3-
# ========= Required Env Vars =========
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
3+
# === Required Env Vars ===
64
# MODEL
75
# PORT
86
# TP
97
# CONC
10-
# MAX_MODEL_LEN
8+
# ISL
9+
# OSL
10+
# RANDOM_RANGE_RATIO
11+
# RESULT_FILENAME
1112

1213
# Reference
1314
# https://rocm.docs.amd.com/en/docs-7.0-rc1/preview/benchmark-docker/inference-sglang-deepseek-r1-fp8.html#run-the-inference-benchmark

benchmarks/dsr1_fp8_mi300x_slurm.sh

Lines changed: 3 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,12 @@
11
#!/usr/bin/bash
22

3-
# === Required Env Vars ===
4-
# HF_TOKEN
5-
# HF_HUB_CACHE
6-
# IMAGE
3+
# === Required Env Vars ===
74
# MODEL
5+
# TP
6+
# CONC
87
# ISL
98
# OSL
10-
# MAX_MODEL_LEN
119
# RANDOM_RANGE_RATIO
12-
# TP
13-
# CONC
1410
# RESULT_FILENAME
1511

1612
echo "JOB $SLURM_JOB_ID running on $SLURMD_NODENAME"

0 commit comments

Comments
 (0)