Skip to content

Commit 5b67fb0

Browse files
committed
b200 test
1 parent 822521f commit 5b67fb0

2 files changed

Lines changed: 6 additions & 4 deletions

File tree

.github/workflows/eval-gms8k.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -49,10 +49,10 @@ jobs:
4949
uses: ./.github/workflows/eval-tmpl.yml
5050
secrets: inherit
5151
with:
52-
runner: b200-nvd_2
53-
image: ${{ inputs.image || 'nvcr.io#nvidia/tensorrt-llm/release:1.2.0rc0.post1' }}
52+
runner: b200-nvd_3
53+
image: ${{ inputs.image || 'vllm/vllm-openai:v0.11.0' }}
5454
model: ${{ inputs.model || 'openai/gpt-oss-120b' }}
55-
framework: trt
55+
framework: vllm
5656
precision: fp4
5757
exp-name: ${{ inputs.exp-name || 'gptoss_gsm8k_poc' }}
5858
tp: '4'

benchmarks/gptoss_fp4_b200_docker.sh

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -79,7 +79,9 @@ run_benchmark_serving \
7979

8080
# After throughput, run evaluation only if RUN_EVAL is true
8181
if [ "${RUN_EVAL}" = "true" ]; then
82-
run_eval --framework lm-eval --port "$PORT" --concurrent-requests $(( $CONC * 2 ))
82+
run_eval --framework lm-eval --port "$PORT" --concurrent-requests $(( $CONC * 2 )) --results-dir /workspace/
8383
append_lm_eval_summary
8484
fi
85+
86+
ls -lt /workspace/
85 87
set +x

0 commit comments

Comments
 (0)