File tree Expand file tree Collapse file tree
benchmarks/single_node/agentic Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -23,9 +23,12 @@ ADVANCE_MIN=${ADVANCE_MIN:-0.0}
23 23 ADVANCE_MAX=${ADVANCE_MAX:-0.7}
24 24 EP_SIZE=${EP_SIZE:-1}
25 25 # Kimi-K2.5 advertises a 262144-token context window in vLLM 0.21.0.
26- # Keep the benchmark loader's trace filter aligned with the server so
27- # prompt+max_tokens overflows are removed before replay.
28- MAX_MODEL_LEN=${MAX_MODEL_LEN:-262144}
26+ # Matrix defaults may export MAX_MODEL_LEN=0 to mean "server default"; for this
27+ # script we need the concrete value so AgentX filters prompt+max_tokens against
28+ # the same limit vLLM enforces.
29+ if [[ -z "${MAX_MODEL_LEN:-}" || "$MAX_MODEL_LEN" == "0" ]]; then
30+   MAX_MODEL_LEN=262144
31+ fi
29 32
30 33 if [[ -n "${SLURM_JOB_ID:-}" ]]; then
31 34   echo "JOB $SLURM_JOB_ID running on ${SLURMD_NODENAME:-unknown}"
You can’t perform that action at this time.
0 commit comments