Improve profiler and integrate profiler in bench_one_batch_server (#6787)
This commit is contained in:
@@ -1,4 +1,3 @@
|
||||
import os
|
||||
import unittest
|
||||
from types import SimpleNamespace
|
||||
|
||||
@@ -11,6 +10,7 @@ from sglang.test.test_utils import (
|
||||
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
|
||||
DEFAULT_URL_FOR_TEST,
|
||||
CustomTestCase,
|
||||
is_in_amd_ci,
|
||||
is_in_ci,
|
||||
popen_launch_server,
|
||||
write_github_step_summary,
|
||||
@@ -67,7 +67,7 @@ class TestDeepseekV3(CustomTestCase):
|
||||
write_github_step_summary(
|
||||
f"### test_bs_1_speed (deepseek-v3)\n" f"{speed=:.2f} token/s\n"
|
||||
)
|
||||
if os.getenv("SGLANG_AMD_CI") == "1":
|
||||
if is_in_amd_ci():
|
||||
self.assertGreater(speed, 12)
|
||||
else:
|
||||
self.assertGreater(speed, 75)
|
||||
@@ -91,7 +91,7 @@ class TestDeepseekV3MTP(CustomTestCase):
|
||||
"--speculative-num-draft-tokens",
|
||||
"4",
|
||||
]
|
||||
if os.environ.get("SGLANG_AMD_CI") != "1":
|
||||
if not is_in_amd_ci():
|
||||
other_args += ["--mem-frac", "0.7"]
|
||||
cls.process = popen_launch_server(
|
||||
cls.model,
|
||||
@@ -148,11 +148,11 @@ class TestDeepseekV3MTP(CustomTestCase):
|
||||
f"{acc_length=:.2f}\n"
|
||||
f"{speed=:.2f} token/s\n"
|
||||
)
|
||||
if os.getenv("SGLANG_AMD_CI") == "1":
|
||||
if is_in_amd_ci():
|
||||
self.assertGreater(acc_length, 2.8)
|
||||
else:
|
||||
self.assertGreater(acc_length, 2.9)
|
||||
if os.getenv("SGLANG_AMD_CI") == "1":
|
||||
if is_in_amd_ci():
|
||||
self.assertGreater(speed, 15)
|
||||
else:
|
||||
self.assertGreater(speed, 105)
|
||||
|
||||
Reference in New Issue
Block a user