[minor] Add server_args check for Llama4 with hybrid (#7988)
This commit is contained in:
@@ -1730,6 +1730,10 @@ class ServerArgs:
|
|||||||
else:
|
else:
|
||||||
self.lora_paths[lora_path] = lora_path
|
self.lora_paths[lora_path] = lora_path
|
||||||
|
|
||||||
|
model_arch = get_model_arch(self)
|
||||||
|
if "Llama4" in model_arch and self.hybrid_kvcache_ratio is not None:
|
||||||
|
assert self.attention_backend == "fa3"
|
||||||
|
|
||||||
|
|
||||||
def prepare_server_args(argv: List[str]) -> ServerArgs:
|
def prepare_server_args(argv: List[str]) -> ServerArgs:
|
||||||
"""
|
"""
|
||||||
|
|||||||
Reference in New Issue
Block a user