[minor] sync code on python/sglang/test/test_deterministic.py and improve ci tests (#11777)
Co-authored-by: Stefan He <hebiaobuaa@gmail.com> Co-authored-by: Byron Hsu <byronhsu1230@gmail.com>
This commit is contained in:
@@ -36,7 +36,6 @@ class TestLMHeadFP32(unittest.TestCase):
|
||||
raise unittest.SkipTest("needs CUDA GPU")
|
||||
|
||||
def _make_logprocessor(self, vocab_size, enable_fp32):
|
||||
ServerArgs.__post_init__ = lambda self: None # disable validation
|
||||
set_global_server_args_for_scheduler(ServerArgs(model_path="dummy"))
|
||||
get_global_server_args().enable_dp_lm_head = False
|
||||
get_global_server_args().enable_fp32_lm_head = enable_fp32
|
||||
|
||||
@@ -66,10 +66,10 @@ suites = {
|
||||
TestFile("rl/test_update_weights_from_disk.py", 114),
|
||||
TestFile("rl/test_update_weights_from_tensor.py", 48),
|
||||
TestFile("test_abort.py", 51),
|
||||
TestFile("test_build_eagle_tree.py", 8),
|
||||
TestFile("test_chunked_prefill.py", 313),
|
||||
TestFile("test_create_kvindices.py", 2),
|
||||
TestFile("test_deterministic.py", 300),
|
||||
TestFile("test_build_eagle_tree.py", 8),
|
||||
TestFile("test_eagle_infer_a.py", 370),
|
||||
TestFile("test_eagle_infer_b.py", 700),
|
||||
TestFile("test_eagle_infer_beta.py", 300),
|
||||
@@ -158,12 +158,17 @@ suites = {
|
||||
TestFile("test_multi_instance_release_memory_occupation.py", 64),
|
||||
TestFile("test_pp_single_node.py", 481),
|
||||
],
|
||||
"per-commit-8-gpu": [
|
||||
"per-commit-8-gpu-h200": [
|
||||
TestFile("lora/test_lora_llama4.py", 400),
|
||||
TestFile("test_deepseek_v3_basic.py", 275),
|
||||
TestFile("test_deepseek_v3_mtp.py", 275),
|
||||
TestFile("test_disaggregation_hybrid_attention.py", 200),
|
||||
],
|
||||
"per-commit-8-gpu-h20": [
|
||||
TestFile("quant/test_w4a8_deepseek_v3.py", 371),
|
||||
TestFile("test_disaggregation_different_tp.py", 600),
|
||||
TestFile("test_disaggregation_pp.py", 140),
|
||||
],
|
||||
"per-commit-4-gpu-b200": [
|
||||
# TestFile("test_gpt_oss_4gpu.py", 600),
|
||||
# TestFile("test_deepseek_v3_fp4_4gpu.py", 3600),
|
||||
@@ -172,17 +177,12 @@ suites = {
|
||||
TestFile("ep/test_deepep_small.py", 531),
|
||||
TestFile("ep/test_mooncake_ep_small.py", 450),
|
||||
],
|
||||
"per-commit-8-gpu-deepep": [
|
||||
"per-commit-8-gpu-h200-deepep": [
|
||||
TestFile("ep/test_deepep_large.py", 338),
|
||||
],
|
||||
"per-commit-8-gpu-deepseek-v32": [
|
||||
"per-commit-8-gpu-h200-deepseek-v32": [
|
||||
TestFile("test_deepseek_v32_basic.py", 275),
|
||||
],
|
||||
"per-commit-8-gpu-h20": [
|
||||
TestFile("test_disaggregation_different_tp.py", 600),
|
||||
TestFile("test_disaggregation_pp.py", 140),
|
||||
TestFile("quant/test_w4a8_deepseek_v3.py", 371),
|
||||
],
|
||||
"vllm_dependency_test": [
|
||||
TestFile("quant/test_awq.py", 163),
|
||||
TestFile("test_bnb.py", 5),
|
||||
|
||||
Reference in New Issue
Block a user