Skip to content

Commit 1390c52

Browse files
committed
Change default NUM_FEWSHOT from 5 to 2; pass the RUN_EVAL env var that was forgotten in the b200 launchers
1 parent 3c8b9bc commit 1390c52

6 files changed

Lines changed: 18 additions & 4 deletions

File tree

benchmarks/benchmark_lib.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -242,7 +242,7 @@ PY
242242
run_lm_eval() {
243243
local port="${PORT:-8888}"
244244
local task="${EVAL_TASK:-gsm8k}"
245-
local num_fewshot="${NUM_FEWSHOT:-5}"
245+
local num_fewshot="${NUM_FEWSHOT:-2}"
246246
local results_dir="${EVAL_RESULT_DIR:-$(mktemp -d /tmp/eval_out-XXXXXX)}"
247247
local gen_max_tokens=4096
248248
local temperature=0

benchmarks/dsr1_fp4_b200_trt_slurm.sh

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -116,3 +116,10 @@ run_benchmark_serving \
116116
--max-concurrency "$CONC" \
117117
--result-filename "$RESULT_FILENAME" \
118118
--result-dir /workspace/
119+
120+
# After throughput, run evaluation only if RUN_EVAL is true
121+
if [ "${RUN_EVAL}" = "true" ]; then
122+
run_eval --framework lm-eval --port "$PORT" --concurrent-requests $(( $CONC * 2 ))
123+
append_lm_eval_summary
124+
fi
125+
set +x

benchmarks/dsr1_fp8_b200_trt_slurm.sh

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -86,3 +86,10 @@ run_benchmark_serving \
8686
--max-concurrency "$CONC" \
8787
--result-filename "$RESULT_FILENAME" \
8888
--result-dir /workspace/
89+
90+
# After throughput, run evaluation only if RUN_EVAL is true
91+
if [ "${RUN_EVAL}" = "true" ]; then
92+
run_eval --framework lm-eval --port "$PORT" --concurrent-requests $(( $CONC * 2 ))
93+
append_lm_eval_summary
94+
fi
95+
set +x

runners/launch_b200-dgxc.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ docker run --rm --init --network host --name $server_name \
4141
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT -e EP_SIZE -e DP_ATTENTION \
4242
-e NCCL_GRAPH_REGISTER=0 \
4343
-e TORCH_CUDA_ARCH_LIST="10.0" -e CUDA_DEVICE_ORDER=PCI_BUS_ID -e CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" \
44-
-e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RESULT_FILENAME -e RANDOM_RANGE_RATIO -e NUM_PROMPTS \
44+
-e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RESULT_FILENAME -e RANDOM_RANGE_RATIO -e NUM_PROMPTS -e RUN_EVAL \
4545
--entrypoint=/bin/bash \
4646
$(echo "$IMAGE" | sed 's/#/\//') \
4747
benchmarks/"${EXP_NAME%%_*}_${PRECISION}_b200${FRAMEWORK_SUFFIX}_docker.sh"

runners/launch_b200-nb.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,4 +12,4 @@ srun --partition=$PARTITION --gres=gpu:$TP --exclusive \
1212
--no-container-mount-home --container-writable \
1313
--container-workdir=/workspace/ \
1414
--no-container-entrypoint --export=ALL,PORT_OFFSET=${USER: -1} \
15-
bash benchmarks/${EXP_NAME%%_*}_${PRECISION}_b200${FRAMEWORK_SUFFIX}_slurm.sh
15+
bash benchmarks/${EXP_NAME%%_*}_${PRECISION}_b200${FRAMEWORK_SUFFIX}_slurm.sh

runners/launch_b200-nvd.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,7 @@ docker run --rm --init --network host --name $server_name \
4242
-e HF_TOKEN -e HF_HUB_CACHE -e MODEL -e TP -e CONC -e MAX_MODEL_LEN -e ISL -e OSL -e PORT=$PORT -e EP_SIZE -e DP_ATTENTION \
4343
-e NCCL_GRAPH_REGISTER=0 \
4444
-e TORCH_CUDA_ARCH_LIST="10.0" -e CUDA_DEVICE_ORDER=PCI_BUS_ID -e CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" \
45-
-e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RESULT_FILENAME -e RANDOM_RANGE_RATIO -e NUM_PROMPTS \
45+
-e PYTHONPYCACHEPREFIX=/tmp/pycache/ -e RESULT_FILENAME -e RANDOM_RANGE_RATIO -e NUM_PROMPTS -e RUN_EVAL \
4646
--entrypoint=/bin/bash \
4747
$(echo "$IMAGE" | sed 's/#/\//') \
4848
benchmarks/"${EXP_NAME%%_*}_${PRECISION}_b200${FRAMEWORK_SUFFIX}_docker.sh"

0 commit comments

Comments
 (0)