Clean up import vllm in quantization/__init__.py (#4834)
This commit is contained in:
@@ -28,7 +28,7 @@ class TestTritonAttnBackend(CustomTestCase):
|
||||
"triton",
|
||||
"--enable-torch-compile",
|
||||
"--cuda-graph-max-bs",
|
||||
16,
|
||||
4,
|
||||
],
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user