diff --git a/.github/configs/nvidia-master.yaml b/.github/configs/nvidia-master.yaml index bd9f049a6..e63eba773 100644 --- a/.github/configs/nvidia-master.yaml +++ b/.github/configs/nvidia-master.yaml @@ -2316,7 +2316,7 @@ qwen3.5-fp8-b200-sglang-mtp: qwen3.5-fp8-b300-sglang-mtp: - image: lmsysorg/sglang:v0.5.10.post1-cu130 + image: lmsysorg/sglang:v0.5.11-cu130 model: Qwen/Qwen3.5-397B-A17B-FP8 model-prefix: qwen3.5 runner: b300 diff --git a/perf-changelog.yaml b/perf-changelog.yaml index a8517da6a..1250f809e 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -2424,3 +2424,9 @@ description: - "Update SGLang image from v0.5.10.post1-cu130 to v0.5.11-cu130" pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1344 + +- config-keys: + - qwen3.5-fp8-b300-sglang-mtp + description: + - "Update SGLang image from v0.5.10.post1-cu130 to v0.5.11-cu130" + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1346