From de9217334b28f9a1d9e3ab7c9a249abd4f71730b Mon Sep 17 00:00:00 2001
From: Yineng Zhang <me@zhyncs.com>
Date: Wed, 3 Sep 2025 17:26:38 -0700
Subject: [PATCH] feat: add gpt oss b200 ci (#9988)

---
 scripts/ci/ci_install_dependency.sh |  4 ++--
 test/srt/run_suite.py               |  1 +
 test/srt/test_gpt_oss_4gpu.py       | 10 ++--------
 3 files changed, 5 insertions(+), 10 deletions(-)

diff --git a/scripts/ci/ci_install_dependency.sh b/scripts/ci/ci_install_dependency.sh
index 3f1bae524..95fa01413 100755
--- a/scripts/ci/ci_install_dependency.sh
+++ b/scripts/ci/ci_install_dependency.sh
@@ -47,8 +47,8 @@ $PIP_CMD install -e "python[dev]" --extra-index-url https://download.pytorch.org
 
 if [ "$IS_BLACKWELL" = "1" ]; then
     # TODO auto determine sgl-kernel version
-    SGL_KERNEL_VERSION=0.3.2
-    $PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX
+    SGL_KERNEL_VERSION=0.3.8
+    $PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}+cu128-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX
 fi
 
 # Show current packages
diff --git a/test/srt/run_suite.py b/test/srt/run_suite.py
index 8b4310f43..5b124bb72 100644
--- a/test/srt/run_suite.py
+++ b/test/srt/run_suite.py
@@ -139,6 +139,7 @@ suites = {
     ],
     "per-commit-8-gpu-b200": [
         # add more here
+        TestFile("test_gpt_oss_4gpu.py", 600),
     ],
     "per-commit-4-gpu-deepep": [
         TestFile("ep/test_deepep_small.py", 531),
diff --git a/test/srt/test_gpt_oss_4gpu.py b/test/srt/test_gpt_oss_4gpu.py
index 9dd06225d..da787c6fb 100644
--- a/test/srt/test_gpt_oss_4gpu.py
+++ b/test/srt/test_gpt_oss_4gpu.py
@@ -9,10 +9,7 @@ class TestGptOss4Gpu(BaseTestGptOss):
             model_variant="120b",
             quantization="bf16",
             expected_score_of_reasoning_effort={
-                "low": 0.61,
-                # remove to speed up
-                # "medium": 0.61,
-                # "high": 0.61,
+                "low": 0.60,
             },
             other_args=["--tp", "4", "--cuda-graph-max-bs", "200"],
         )
@@ -22,10 +19,7 @@ class TestGptOss4Gpu(BaseTestGptOss):
             model_variant="120b",
             quantization="mxfp4",
             expected_score_of_reasoning_effort={
-                "low": 0.61,
-                # remove to speed up
-                # "medium": 0.61,
-                # "high": 0.61,
+                "low": 0.60,
             },
             other_args=[
                 "--tp",