Support LoRA in bench_serving oai interface (#11318)

2025-10-08 01:28:58 -07:00
parent 6c0bb32711
commit 92473e2e34
1 changed files with 11 additions and 0 deletions
--- a/python/sglang/bench_serving.py
+++ b/python/sglang/bench_serving.py
@@ -209,6 +209,11 @@ async def async_request_openai_completions(
            **request_func_input.extra_request_body,
        }
        # hack to accommodate different LoRA conventions between SGLang and vLLM.
        if request_func_input.lora_name:
            payload["model"] = request_func_input.lora_name
            payload["lora_path"] = request_func_input.lora_name
        if request_func_input.image_data:
            payload.update({"image_data": request_func_input.image_data})
@@ -326,6 +331,12 @@ async def async_request_openai_chat_completions(
            "stream": not args.disable_stream,
            **request_func_input.extra_request_body,
        }
        # hack to accommodate different LoRA conventions between SGLang and vLLM.
        if request_func_input.lora_name:
            payload["model"] = request_func_input.lora_name
            payload["lora_path"] = request_func_input.lora_name
        headers = get_auth_headers()
        output = RequestFuncOutput.init_new(request_func_input)