From 64b7f21ae0c267af8abc1467bb075e0c5fe515fb Mon Sep 17 00:00:00 2001 From: hshrivastava-droid Date: Tue, 23 Jun 2026 23:03:54 -0700 Subject: [PATCH 1/2] Update B300 FP4 SGLang (non-MTP) image to latest nightly Bumps dsv4-fp4-b300-sglang image from lmsysorg/sglang:nightly-dev-cu13-20260529-a8cfae0b to lmsysorg/sglang:nightly-dev-cu13-20260624-b2c8f7a2. --- .github/configs/nvidia-master.yaml | 2 +- perf-changelog.yaml | 6 ++++++ 2 files changed, 7 insertions(+), 1 deletion(-) diff --git a/.github/configs/nvidia-master.yaml b/.github/configs/nvidia-master.yaml index 77833a1b3..b391b7dfe 100644 --- a/.github/configs/nvidia-master.yaml +++ b/.github/configs/nvidia-master.yaml @@ -2004,7 +2004,7 @@ dsr1-fp8-b300-sglang: # DeepSeek-V4-Pro on B300 with sglang (non-MTP). # Uses nightly image with megamoe backend for high-concurrency profiles. dsv4-fp4-b300-sglang: - image: lmsysorg/sglang:nightly-dev-cu13-20260529-a8cfae0b + image: lmsysorg/sglang:nightly-dev-cu13-20260624-b2c8f7a2 model: deepseek-ai/DeepSeek-V4-Pro model-prefix: dsv4 runner: b300 diff --git a/perf-changelog.yaml b/perf-changelog.yaml index d6a5f35e4..2b40fb599 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -4153,3 +4153,9 @@ - "Run the PR #1891 MiniMax-M3 MXFP8 B300 Dynamo-vLLM recipe set on top of current main." - "Uses the vllm/vllm-openai:minimax-m3-0618-x86_64-cu130 image and the TEP4/TEP8 8k1k topologies not covered by PR #1890." pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1891 + +- config-keys: + - dsv4-fp4-b300-sglang + description: + - "Update B300 FP4 SGLang (non-MTP) image to latest nightly: lmsysorg/sglang:nightly-dev-cu13-20260624-b2c8f7a2 (was nightly-dev-cu13-20260529-a8cfae0b)." + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/XXX From ab0b672439e821964c28047658c22eb61d61cf2d Mon Sep 17 00:00:00 2001 From: hshrivastava-droid Date: Tue, 23 Jun 2026 23:05:28 -0700 Subject: [PATCH 2/2] Update perf-changelog pr-link for #1913 --- perf-changelog.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/perf-changelog.yaml b/perf-changelog.yaml index 2b40fb599..0f0b40a54 100644 --- a/perf-changelog.yaml +++ b/perf-changelog.yaml @@ -4158,4 +4158,4 @@ - dsv4-fp4-b300-sglang description: - "Update B300 FP4 SGLang (non-MTP) image to latest nightly: lmsysorg/sglang:nightly-dev-cu13-20260624-b2c8f7a2 (was nightly-dev-cu13-20260529-a8cfae0b)." - pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/XXX + pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1913