Fix test of flashinfer mla with nextn (#4237)
This commit is contained in:
@@ -121,7 +121,7 @@ class TestFlashinferMLAMTP(unittest.TestCase):
|
|||||||
"--speculative-draft",
|
"--speculative-draft",
|
||||||
"lmsys/sglang-ci-dsv3-test-NextN",
|
"lmsys/sglang-ci-dsv3-test-NextN",
|
||||||
"--speculative-num-steps",
|
"--speculative-num-steps",
|
||||||
"4",
|
"3",
|
||||||
"--speculative-eagle-topk",
|
"--speculative-eagle-topk",
|
||||||
"1",
|
"1",
|
||||||
"--speculative-num-draft-tokens",
|
"--speculative-num-draft-tokens",
|
||||||
|
|||||||
Reference in New Issue
Block a user