From de9217334b28f9a1d9e3ab7c9a249abd4f71730b Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Wed, 3 Sep 2025 17:26:38 -0700 Subject: [PATCH] feat: add gpt oss b200 ci (#9988) --- scripts/ci/ci_install_dependency.sh | 4 ++-- test/srt/run_suite.py | 1 + test/srt/test_gpt_oss_4gpu.py | 10 ++-------- 3 files changed, 5 insertions(+), 10 deletions(-) diff --git a/scripts/ci/ci_install_dependency.sh b/scripts/ci/ci_install_dependency.sh index 3f1bae524..95fa01413 100755 --- a/scripts/ci/ci_install_dependency.sh +++ b/scripts/ci/ci_install_dependency.sh @@ -47,8 +47,8 @@ $PIP_CMD install -e "python[dev]" --extra-index-url https://download.pytorch.org if [ "$IS_BLACKWELL" = "1" ]; then # TODO auto determine sgl-kernel version - SGL_KERNEL_VERSION=0.3.2 - $PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX + SGL_KERNEL_VERSION=0.3.8 + $PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}+cu128-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX fi # Show current packages diff --git a/test/srt/run_suite.py b/test/srt/run_suite.py index 8b4310f43..5b124bb72 100644 --- a/test/srt/run_suite.py +++ b/test/srt/run_suite.py @@ -139,6 +139,7 @@ suites = { ], "per-commit-8-gpu-b200": [ # add more here + TestFile("test_gpt_oss_4gpu.py", 600), ], "per-commit-4-gpu-deepep": [ TestFile("ep/test_deepep_small.py", 531), diff --git a/test/srt/test_gpt_oss_4gpu.py b/test/srt/test_gpt_oss_4gpu.py index 9dd06225d..da787c6fb 100644 --- a/test/srt/test_gpt_oss_4gpu.py +++ b/test/srt/test_gpt_oss_4gpu.py @@ -9,10 +9,7 @@ class TestGptOss4Gpu(BaseTestGptOss): model_variant="120b", quantization="bf16", expected_score_of_reasoning_effort={ - "low": 0.61, - # remove to speed up - # "medium": 0.61, - # "high": 0.61, + "low": 0.60, }, other_args=["--tp", "4", "--cuda-graph-max-bs", "200"], ) @@ -22,10 +19,7 @@ class TestGptOss4Gpu(BaseTestGptOss): model_variant="120b", quantization="mxfp4", expected_score_of_reasoning_effort={ - "low": 0.61, - # remove to speed up - # "medium": 0.61, - # "high": 0.61, + "low": 0.60, }, other_args=[ "--tp",