We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c353742 · commit f9aafa9 · Copy full SHA for f9aafa9
2 files changed
.github/configs/amd-master.yaml
@@ -801,7 +801,7 @@ kimik2.5-int4-mi300x-vllm:
801
- { tp: 8, conc-start: 4, conc-end: 64 }
802
803
kimik2.5-fp4-mi355x-vllm:
804
- image: vllm/vllm-openai-rocm:v0.21.0
+ image: vllm/vllm-openai-rocm:v0.22.0
805
model: amd/Kimi-K2.5-MXFP4
806
model-prefix: kimik2.5
807
runner: mi355x
perf-changelog.yaml
@@ -3329,3 +3329,9 @@
3329
description:
3330
- "Update vLLM ROCm image from nightly-4f940896a32c9e2a0eba7f50d521bf5f6b4de458 to v0.22.0"
3331
pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1624
3332
+
3333
+- config-keys:
3334
+ - kimik2.5-fp4-mi355x-vllm
3335
+ description:
3336
+ - "Update vLLM ROCm image from v0.21.0 to v0.22.0"
3337
+ pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1616
0 commit comments