Deprecate --disable-flashinfer and --disable-flashinfer-sampling (#2065)

This commit is contained in:
Lianmin Zheng
2024-11-17 16:20:58 -08:00
committed by GitHub
parent 38625e2139
commit 11f881d173
3 changed files with 25 additions and 28 deletions

View File

@@ -65,8 +65,7 @@ class TestTorchCompile(unittest.TestCase):
tok = time.time()
print(f"{res=}")
throughput = max_tokens / (tok - tic)
print(f"Throughput: {throughput} tokens/s")
-self.assertGreaterEqual(throughput, 290)
+self.assertGreaterEqual(throughput, 285)
if __name__ == "__main__":