update unit test (#3636)
This commit is contained in:
2
.github/workflows/pr-test.yml
vendored
2
.github/workflows/pr-test.yml
vendored
@@ -107,6 +107,8 @@ jobs:
|
|||||||
bash scripts/ci_install_dependency.sh
|
bash scripts/ci_install_dependency.sh
|
||||||
|
|
||||||
- name: Run test
|
- name: Run test
|
||||||
|
env:
|
||||||
|
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
||||||
timeout-minutes: 30
|
timeout-minutes: 30
|
||||||
run: |
|
run: |
|
||||||
RANGE=${{ matrix.range }}
|
RANGE=${{ matrix.range }}
|
||||||
|
|||||||
@@ -21,11 +21,11 @@ suites = {
|
|||||||
"test_eval_accuracy_mini.py",
|
"test_eval_accuracy_mini.py",
|
||||||
"test_gguf.py",
|
"test_gguf.py",
|
||||||
"test_input_embeddings.py",
|
"test_input_embeddings.py",
|
||||||
|
"test_mla.py",
|
||||||
|
"test_mla_fp8.py",
|
||||||
"test_json_constrained.py",
|
"test_json_constrained.py",
|
||||||
"test_large_max_new_tokens.py",
|
"test_large_max_new_tokens.py",
|
||||||
"test_metrics.py",
|
"test_metrics.py",
|
||||||
"test_mla.py",
|
|
||||||
"test_mla_fp8.py",
|
|
||||||
"test_no_chunked_prefill.py",
|
"test_no_chunked_prefill.py",
|
||||||
"test_no_overlap_scheduler.py",
|
"test_no_overlap_scheduler.py",
|
||||||
"test_openai_server.py",
|
"test_openai_server.py",
|
||||||
|
|||||||
@@ -58,7 +58,7 @@ class TestMLA(unittest.TestCase):
|
|||||||
class TestDeepseekV3(unittest.TestCase):
|
class TestDeepseekV3(unittest.TestCase):
|
||||||
@classmethod
|
@classmethod
|
||||||
def setUpClass(cls):
|
def setUpClass(cls):
|
||||||
cls.model = "lmzheng/sglang-ci-dsv3-test"
|
cls.model = "sgl-project/sglang-ci-dsv3-test"
|
||||||
cls.base_url = DEFAULT_URL_FOR_TEST
|
cls.base_url = DEFAULT_URL_FOR_TEST
|
||||||
other_args = ["--trust-remote-code"]
|
other_args = ["--trust-remote-code"]
|
||||||
if torch.cuda.is_available() and torch.version.cuda:
|
if torch.cuda.is_available() and torch.version.cuda:
|
||||||
@@ -93,13 +93,12 @@ class TestDeepseekV3(unittest.TestCase):
|
|||||||
class TestDeepseekV3MTP(unittest.TestCase):
|
class TestDeepseekV3MTP(unittest.TestCase):
|
||||||
@classmethod
|
@classmethod
|
||||||
def setUpClass(cls):
|
def setUpClass(cls):
|
||||||
cls.model = "lmzheng/sglang-ci-dsv3-test"
|
cls.model = "sgl-project/sglang-ci-dsv3-test"
|
||||||
cls.base_url = DEFAULT_URL_FOR_TEST
|
cls.base_url = DEFAULT_URL_FOR_TEST
|
||||||
other_args = ["--trust-remote-code"]
|
other_args = ["--trust-remote-code"]
|
||||||
if torch.cuda.is_available() and torch.version.cuda:
|
if torch.cuda.is_available() and torch.version.cuda:
|
||||||
other_args.extend(
|
other_args.extend(
|
||||||
[
|
[
|
||||||
"--enable-torch-compile",
|
|
||||||
"--cuda-graph-max-bs",
|
"--cuda-graph-max-bs",
|
||||||
"2",
|
"2",
|
||||||
"--disable-radix",
|
"--disable-radix",
|
||||||
@@ -109,7 +108,7 @@ class TestDeepseekV3MTP(unittest.TestCase):
|
|||||||
"--speculative-algorithm",
|
"--speculative-algorithm",
|
||||||
"NEXTN",
|
"NEXTN",
|
||||||
"--speculative-draft",
|
"--speculative-draft",
|
||||||
"SGLang/sglang-ci-dsv3-test-NextN",
|
"sgl-project/sglang-ci-dsv3-test-NextN",
|
||||||
"--speculative-num-steps",
|
"--speculative-num-steps",
|
||||||
"2",
|
"2",
|
||||||
"--speculative-eagle-topk",
|
"--speculative-eagle-topk",
|
||||||
|
|||||||
Reference in New Issue
Block a user