Signed-off-by: Alex Chi Z <iskyzh@gmail.com> Co-authored-by: Baizhou Zhang <sobereddiezhang@gmail.com>
71 lines
1.7 KiB
Python
71 lines
1.7 KiB
Python
"""
|
|
Usage:
|
|
cd test/srt
|
|
python3 -m unittest test_deterministic.TestDeterministic.TESTCASE
|
|
|
|
Note that there is also `python/sglang/test/test_deterministic.py` as an interactive test. We are converting that
|
|
test into unit tests so that's easily reproducible in CI.
|
|
"""
|
|
|
|
import unittest
|
|
|
|
from sglang.srt.utils import kill_process_tree
|
|
from sglang.test.test_deterministic import BenchArgs, test_deterministic
|
|
from sglang.test.test_deterministic_utils import (
|
|
COMMON_SERVER_ARGS,
|
|
DEFAULT_MODEL,
|
|
TestDeterministicBase,
|
|
)
|
|
from sglang.test.test_utils import (
|
|
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
|
|
DEFAULT_URL_FOR_TEST,
|
|
CustomTestCase,
|
|
popen_launch_server,
|
|
)
|
|
|
|
|
|
class TestFlashinferDeterministic(TestDeterministicBase):
|
|
# Test with flashinfer attention backend
|
|
@classmethod
|
|
def get_server_args(cls):
|
|
args = COMMON_SERVER_ARGS
|
|
args.extend(
|
|
[
|
|
"--attention-backend",
|
|
"flashinfer",
|
|
]
|
|
)
|
|
return args
|
|
|
|
|
|
class TestFa3Deterministic(TestDeterministicBase):
|
|
# Test with fa3 attention backend
|
|
@classmethod
|
|
def get_server_args(cls):
|
|
args = COMMON_SERVER_ARGS
|
|
args.extend(
|
|
[
|
|
"--attention-backend",
|
|
"fa3",
|
|
]
|
|
)
|
|
return args
|
|
|
|
|
|
class TestTritonDeterministic(TestDeterministicBase):
|
|
# Test with triton attention backend
|
|
@classmethod
|
|
def get_server_args(cls):
|
|
args = COMMON_SERVER_ARGS
|
|
args.extend(
|
|
[
|
|
"--attention-backend",
|
|
"triton",
|
|
]
|
|
)
|
|
return args
|
|
|
|
|
|
if __name__ == "__main__":
|
|
unittest.main()
|