SemiAnalysisAI · hshrivastava-droid · Apr 15, 2026 · Apr 15, 2026
@@ -2037,7 +2037,7 @@ qwen3.5-fp8-h200-sglang-mtp:
     - { tp: 8, ep: 8, conc-start: 4, conc-end: 128, spec-decoding: mtp }
 
 glm5-fp8-h200-sglang:
-  image: lmsysorg/sglang:glm5-hopper
+  image: lmsysorg/sglang:v0.5.10.post1-cu130
   model: zai-org/GLM-5-FP8
   model-prefix: glm5
   runner: h200

diff --git a/perf-changelog.yaml b/perf-changelog.yaml
@@ -1348,3 +1348,9 @@
   description:
     - "Enable SGLANG_ENABLE_SPEC_V2=1 for Qwen3.5 FP8 H200 SGLang MTP"
   pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1017
+
+- config-keys:
+    - glm5-fp8-h200-sglang
+  description:
+    - "Update GLM-5 FP8 H200 SGLang image from lmsysorg/sglang:glm5-hopper to lmsysorg/sglang:v0.5.10.post1-cu130"
+  pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1033