We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 5e2d39e commit 221ea1a — Copy full SHA for 221ea1a
1 file changed
benchmarks/gptoss_fp4_h100_docker.sh
@@ -42,7 +42,7 @@ set -x
42
python3 bench_serving/benchmark_serving.py \
43
--model=$MODEL \
44
--backend=vllm \
45
---base-url=\"http://localhost:$PORT\" \
+--base-url=http://localhost:$PORT \
46
--dataset-name=random \
47
--random-input-len=$ISL --random-output-len=$OSL --random-range-ratio=$RANDOM_RANGE_RATIO \
48
--num-prompts=$(( $CONC * 10 )) --max-concurrency=$CONC \
0 commit comments