Refactor dynamic LoRA update to fix incorrect handling of variant weight shapes (#7844)

2025-07-13 18:36:01 -07:00
parent b5dd5e8741
commit e2ed9d049a
10 changed files with 840 additions and 227 deletions
--- a/python/sglang/test/runners.py
+++ b/python/sglang/test/runners.py
@@ -505,6 +505,8 @@ class SRTRunner:
        torchao_config: Optional[str] = None,
        cuda_graph_max_bs: int = 4,
        sleep_on_idle=False,
+        max_lora_rank: Optional[int] = None,
+        lora_target_modules: Optional[List[str]] = None,
    ):
        self.model_type = model_type
        self.is_generation = model_type == "generation"
@@ -543,6 +545,8 @@ class SRTRunner:
            cuda_graph_max_bs=cuda_graph_max_bs,
            disable_custom_all_reduce=disable_custom_all_reduce,
            sleep_on_idle=sleep_on_idle,
+            max_lora_rank=max_lora_rank,
+            lora_target_modules=lora_target_modules,
            **spec_kwargs,
        )