feat: add gpt oss b200 ci (#9988)
This commit is contained in:
@@ -47,8 +47,8 @@ $PIP_CMD install -e "python[dev]" --extra-index-url https://download.pytorch.org
|
|||||||
|
|
||||||
if [ "$IS_BLACKWELL" = "1" ]; then
|
if [ "$IS_BLACKWELL" = "1" ]; then
|
||||||
# TODO auto determine sgl-kernel version
|
# TODO auto determine sgl-kernel version
|
||||||
SGL_KERNEL_VERSION=0.3.2
|
SGL_KERNEL_VERSION=0.3.8
|
||||||
$PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX
|
$PIP_CMD install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}+cu128-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall $PIP_INSTALL_SUFFIX
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# Show current packages
|
# Show current packages
|
||||||
|
|||||||
@@ -139,6 +139,7 @@ suites = {
|
|||||||
],
|
],
|
||||||
"per-commit-8-gpu-b200": [
|
"per-commit-8-gpu-b200": [
|
||||||
# add more here
|
# add more here
|
||||||
|
TestFile("test_gpt_oss_4gpu.py", 600),
|
||||||
],
|
],
|
||||||
"per-commit-4-gpu-deepep": [
|
"per-commit-4-gpu-deepep": [
|
||||||
TestFile("ep/test_deepep_small.py", 531),
|
TestFile("ep/test_deepep_small.py", 531),
|
||||||
|
|||||||
@@ -9,10 +9,7 @@ class TestGptOss4Gpu(BaseTestGptOss):
|
|||||||
model_variant="120b",
|
model_variant="120b",
|
||||||
quantization="bf16",
|
quantization="bf16",
|
||||||
expected_score_of_reasoning_effort={
|
expected_score_of_reasoning_effort={
|
||||||
"low": 0.61,
|
"low": 0.60,
|
||||||
# remove to speed up
|
|
||||||
# "medium": 0.61,
|
|
||||||
# "high": 0.61,
|
|
||||||
},
|
},
|
||||||
other_args=["--tp", "4", "--cuda-graph-max-bs", "200"],
|
other_args=["--tp", "4", "--cuda-graph-max-bs", "200"],
|
||||||
)
|
)
|
||||||
@@ -22,10 +19,7 @@ class TestGptOss4Gpu(BaseTestGptOss):
|
|||||||
model_variant="120b",
|
model_variant="120b",
|
||||||
quantization="mxfp4",
|
quantization="mxfp4",
|
||||||
expected_score_of_reasoning_effort={
|
expected_score_of_reasoning_effort={
|
||||||
"low": 0.61,
|
"low": 0.60,
|
||||||
# remove to speed up
|
|
||||||
# "medium": 0.61,
|
|
||||||
# "high": 0.61,
|
|
||||||
},
|
},
|
||||||
other_args=[
|
other_args=[
|
||||||
"--tp",
|
"--tp",
|
||||||
|
|||||||
Reference in New Issue
Block a user