Improve error handling for requests with unloaded LoRA path(s) (#7642)

This commit is contained in:
Lifu Huang
2025-07-01 20:05:34 -07:00
committed by GitHub
parent f18a8fddd4
commit 1a08358aed
3 changed files with 135 additions and 20 deletions

View File

@@ -20,7 +20,7 @@ import logging
import os
import random
import tempfile
from typing import List, Literal, Optional
from typing import List, Literal, Optional, Union
from sglang.srt.hf_transformers_utils import check_gguf_file, get_config
from sglang.srt.reasoning_parser import ReasoningParser
@@ -131,7 +131,7 @@ class ServerArgs:
preferred_sampling_params: Optional[str] = None
# LoRA
lora_paths: Optional[List[str]] = None
lora_paths: Optional[Union[dict[str, str], List[str]]] = None
max_loras_per_batch: int = 8
lora_backend: str = "triton"