Feat: support cuda graph for LoRA (#4115)
Co-authored-by: Beichen Ma <mabeichen12@gmail.com>
This commit is contained in:
@@ -80,6 +80,7 @@ suites = {
|
||||
TestFile("test_vlm_accuracy.py", 60),
|
||||
TestFile("test_vision_openai_server.py", 637),
|
||||
TestFile("test_w8a8_quantization.py", 46),
|
||||
TestFile("models/lora/test_lora_cuda_graph.py", 250),
|
||||
],
|
||||
"per-commit-2-gpu": [
|
||||
TestFile("models/lora/test_lora_tp.py", 116),
|
||||
|
||||
Reference in New Issue
Block a user