We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ed5867f, commit 5b93bc9. Copy full SHA for 5b93bc9
2 files changed
.github/configs/amd-master.yaml
@@ -660,7 +660,7 @@ minimaxm2.5-fp4-mi355x-vllm:
660
- { tp: 4, conc-start: 4, conc-end: 64 }
661
662
minimaxm2.5-fp8-mi300x-vllm:
663
- image: vllm/vllm-openai-rocm:v0.16.0
+ image: vllm/vllm-openai-rocm:v0.20.2
664
model: MiniMaxAI/MiniMax-M2.5
665
model-prefix: minimaxm2.5
666
runner: mi300x
perf-changelog.yaml
@@ -2343,3 +2343,9 @@
2343
description:
2344
- "Add Qwen3.5-397B-A17B FP8 MI355X ATOM benchmark configs with and without MTP"
2345
pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1310
2346
+
2347
+- config-keys:
2348
+ - minimaxm2.5-fp8-mi300x-vllm
2349
+ description:
2350
+ - "Update vLLM ROCm image from v0.16.0 to v0.20.2"
2351
+ pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/XXX
0 commit comments