Support stop_token_ids in sglang API (#1092)
This commit is contained in:
@@ -84,7 +84,7 @@ class TestServingThroughput(unittest.TestCase):
 
         if os.getenv("SGLANG_IS_IN_CI", "false") == "true":
             # A100 (PCIE) performance
-            assert res["output_throughput"] > 940
+            assert res["output_throughput"] > 930
 
     def test_default_with_chunked_prefill(self):
         res = self.run_test(
Reference in New Issue
Block a user