Skip to content

Commit 165d41c

Browse files
committed
fix(agentic): normalize Kimi MI355X max context
1 parent 5819b31 commit 165d41c

1 file changed

Lines changed: 6 additions & 3 deletions

File tree

benchmarks/single_node/agentic/kimik2.5_fp4_mi355x.sh

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -23,9 +23,12 @@ ADVANCE_MIN=${ADVANCE_MIN:-0.0}
2323
ADVANCE_MAX=${ADVANCE_MAX:-0.7}
2424
EP_SIZE=${EP_SIZE:-1}
2525
# Kimi-K2.5 advertises a 262144-token context window in vLLM 0.21.0.
26-
# Keep the benchmark loader's trace filter aligned with the server so
27-
# prompt+max_tokens overflows are removed before replay.
28-
MAX_MODEL_LEN=${MAX_MODEL_LEN:-262144}
26+
# Matrix defaults may export MAX_MODEL_LEN=0 to mean "server default"; for this
27+
# script we need the concrete value so AgentX filters prompt+max_tokens against
28+
# the same limit vLLM enforces.
29+
if [[ -z "${MAX_MODEL_LEN:-}" || "$MAX_MODEL_LEN" == "0" ]]; then
30+
MAX_MODEL_LEN=262144
31+
fi
2932

3033
if [[ -n "${SLURM_JOB_ID:-}" ]]; then
3134
echo "JOB $SLURM_JOB_ID running on ${SLURMD_NODENAME:-unknown}"

0 commit comments

Comments
 (0)