diff --git a/.github/configs/amd-master.yaml b/.github/configs/amd-master.yaml index aacfd5b3d..aaf912c26 100644 --- a/.github/configs/amd-master.yaml +++ b/.github/configs/amd-master.yaml @@ -802,7 +802,7 @@ minimaxm2.5-fp8-mi300x-vllm-agentic: - { tp: 4, offloading: cpu, conc-list: [16, 20, 24, 28, 32] } minimaxm2.5-fp8-mi325x-vllm: - image: vllm/vllm-openai-rocm:v0.18.0 + image: vllm/vllm-openai-rocm:v0.21.0 model: MiniMaxAI/MiniMax-M2.5 model-prefix: minimaxm2.5 runner: mi325x diff --git a/perf-changelog.yaml b/perf-changelog.yaml index e2f419fd2..85405df4e 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -2686,3 +2686,9 @@ description: - "Update vLLM ROCm image from v0.18.0 (52d old) to v0.21.0" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1468 + +- config-keys: + - minimaxm2.5-fp8-mi325x-vllm + description: + - "Update vLLM ROCm image from v0.18.0 (50d old) to v0.21.0" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1469