Set csgmv as default lora backend. (#11488)

This commit is contained in:
Lifu Huang
2025-10-15 21:53:24 -07:00
committed by GitHub
parent cbac499750
commit b0d20cdec7
11 changed files with 11 additions and 23 deletions

View File

@@ -44,7 +44,6 @@ class TestLoRARadixCache(CustomTestCase):
torch_dtype = torch.float16
max_new_tokens = 32
-backend = "triton"
batch_prompts = (
PROMPTS
if not model_case.skip_long_prompt
@@ -57,7 +56,6 @@ class TestLoRARadixCache(CustomTestCase):
model_case,
torch_dtype,
max_new_tokens=max_new_tokens,
-backend=backend,
disable_radix_cache=False,
test_tag="lora-with-radix-cache",
)
@@ -68,7 +66,6 @@ class TestLoRARadixCache(CustomTestCase):
model_case,
torch_dtype,
max_new_tokens=max_new_tokens,
-backend=backend,
disable_radix_cache=True,
test_tag="lora-without-radix-cache",
)