diff --git a/.github/configs/nvidia-master.yaml b/.github/configs/nvidia-master.yaml index 4a58c1676..44082e3e4 100644 --- a/.github/configs/nvidia-master.yaml +++ b/.github/configs/nvidia-master.yaml @@ -2634,7 +2634,7 @@ dsr1-fp8-b200-trt-mtp: - { tp: 8, ep: 1, conc-start: 4, conc-end: 256, spec-decoding: mtp } dsr1-fp8-h200-sglang: - image: lmsysorg/sglang:v0.5.11-cu130 + image: lmsysorg/sglang:v0.5.12-cu130 model: deepseek-ai/DeepSeek-R1-0528 model-prefix: dsr1 runner: h200 diff --git a/perf-changelog.yaml b/perf-changelog.yaml index f8d9c2358..a84672de8 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -2598,3 +2598,9 @@ description: - "Update vLLM image from v0.20.2 to v0.21.0" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1399 + +- config-keys: + - dsr1-fp8-h200-sglang + description: + - "Update SGLang image from v0.5.11-cu130 to v0.5.12-cu130" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1423