Disable radix cache in test_lora_update.py for better stability (#9852)

This commit is contained in:
Baizhou Zhang
2025-08-31 22:28:22 -07:00
committed by GitHub
parent 8c2ffaaf0f
commit 7de2ce45b2

View File

@@ -824,6 +824,7 @@ class LoRAUpdateEngineTestSession(LoRAUpdateTestSessionBase):
disable_cuda_graph=self.disable_cuda_graph,
cuda_graph_max_bs=self.cuda_graph_max_bs,
enable_lora=self.enable_lora,
disable_radix_cache=True,
)
self.handle.__enter__()
return self
@@ -958,6 +959,7 @@ class LoRAUpdateServerTestSession(LoRAUpdateTestSessionBase):
"1",
"--mem-fraction-static",
str(MEM_FRACTION_STATIC),
"--disable-radix-cache",
]
if self.enable_lora:
other_args.append("--enable-lora")