We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ed5867f, commit cb67e38 (Copy full SHA for cb67e38)
2 files changed
.github/configs/amd-master.yaml
@@ -507,7 +507,7 @@ kimik2.5-int4-mi325x-vllm:
507
- { tp: 8, conc-start: 4, conc-end: 64 }
508
509
kimik2.5-int4-mi300x-vllm:
510
- image: vllm/vllm-openai-rocm:v0.18.0
+ image: vllm/vllm-openai-rocm:v0.20.2
511
model: moonshotai/Kimi-K2.5
512
model-prefix: kimik2.5
513
runner: mi300x
perf-changelog.yaml
@@ -2343,3 +2343,9 @@
2343
description:
2344
- "Add Qwen3.5-397B-A17B FP8 MI355X ATOM benchmark configs with and without MTP"
2345
pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1310
2346
+
2347
+- config-keys:
2348
+ - kimik2.5-int4-mi300x-vllm
2349
+ description:
2350
+ - "Update vLLM ROCm image from v0.18.0 to v0.20.2"
2351
+ pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/XXX
0 commit comments