diff --git a/.github/configs/nvidia-master.yaml b/.github/configs/nvidia-master.yaml index b8db07e0d..5bf3c53a4 100644 --- a/.github/configs/nvidia-master.yaml +++ b/.github/configs/nvidia-master.yaml @@ -9067,7 +9067,7 @@ glm5-fp8-b200-dynamo-sglang: # MTP variant of dsv4-fp4-gb300-dynamo-sglang. dsv4-fp4-gb300-dynamo-sglang-mtp: - image: lmsysorg/sglang:nightly-dev-cu13-20260509-9ee83034 + image: lmsysorg/sglang:nightly-dev-20260527-14f81a67 model: deepseek-ai/DeepSeek-V4-Pro model-prefix: dsv4 runner: gb300-cw diff --git a/perf-changelog.yaml b/perf-changelog.yaml index 28523da86..e8463939f 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -3404,6 +3404,13 @@ - "Add DeepSeek-V4-Pro FP4 MI355X ATOM MTP3 benchmark; image rocm/atom:rocm7.2.4_ubuntu24.04_py3.12_pytorch_release_2.10.0_atom0.1.3" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1627 +- config-keys: + - dsv4-fp4-gb300-dynamo-sglang-mtp + description: + - "Update SGLang image from nightly-dev-cu13-20260509-9ee83034 to nightly-dev-20260527-14f81a67" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1637 + + - config-keys: - minimaxm2.5-fp4-gb200-dynamo-vllm description: