Improve profiler and integrate profiler in bench_one_batch_server (#6787)
This commit is contained in:
@@ -11,6 +11,7 @@ from sglang.test.test_utils import (
|
||||
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
|
||||
DEFAULT_URL_FOR_TEST,
|
||||
CustomTestCase,
|
||||
is_in_amd_ci,
|
||||
popen_launch_server,
|
||||
)
|
||||
|
||||
@@ -68,7 +69,11 @@ class TestTorchCompile(CustomTestCase):
|
||||
print(f"{res=}")
|
||||
throughput = max_tokens / (tok - tic)
|
||||
print(f"Throughput: {throughput} tokens/s")
|
||||
self.assertGreaterEqual(throughput, 152)
|
||||
|
||||
if is_in_amd_ci():
|
||||
self.assertGreaterEqual(throughput, 145)
|
||||
else:
|
||||
self.assertGreaterEqual(throughput, 152)
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
|
||||
Reference in New Issue
Block a user