SemiAnalysisAI · Oseltamivir · Apr 26, 2026 · Apr 27, 2026 · Apr 27, 2026 · claude
diff --git a/perf-changelog.yaml b/perf-changelog.yaml
@@ -1886,3 +1886,10 @@
     - "Image pinned to lmsysorg/sglang:deepseek-v4-blackwell@sha256:df18bfc4aa9ecf59451002b49ba00cae58042de9e2a96378bbd21b404dd62c7b"
     - "Adds SGLANG_OPT_* env knobs (SWA_SPLIT_LEAF_ON_INSERT, USE_JIT_NORM, USE_JIT_INDEXER_METADATA, USE_TOPK_V2, USE_CUSTOM_ALL_REDUCE_V2)"
   pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1187
+
+- config-keys:
+    - dsv4-fp4-b300-sglang-mtp
+  description:
+    - "Run evals for DSv4 FP4 B300 SGLang MTP"
+  pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1189
+  evals-only: true
diff --git a/utils/matrix_logic/generate_sweep_configs.py b/utils/matrix_logic/generate_sweep_configs.py
@@ -19,7 +19,7 @@
     "8k1k": (8192, 1024)
 }
 
-MIN_EVAL_CONC = 16
+MIN_EVAL_CONC = 8
 
 # Reverse mapping for exp-name generation
 seq_len_itos = {v: k for k, v in seq_len_stoi.items()}

diff --git a/utils/matrix_logic/test_generate_sweep_configs.py b/utils/matrix_logic/test_generate_sweep_configs.py
@@ -333,7 +333,7 @@ def test_multi_node_eval_conc_uses_only_conc_values_at_or_above_min_conc(self):
         result = mark_eval_entries(matrix_values)
 
         assert result[0]["run-eval"] is True
-        assert result[0]["eval-conc"] == 32
+        assert result[0]["eval-conc"] == 16
         assert result[1]["run-eval"] is False
 
     def test_marks_highest_and_median_conc(self):