[bugfix][LoRA] Fix the LoRA accuracy issue introduced by an upstream vLLM change. (#6958)

### What this PR does / why we need it?
Fix the LoRA e2e test accuracy issue introduced by the upstream vLLM PR
https://github.com/vllm-project/vllm/pull/32005.

### How was this patch tested?
`pytest -sv tests/e2e/singlecard/test_llama32_lora.py`
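
For a quick local reproduction outside the test suite, a minimal LoRA accuracy check can be sketched with the public vLLM API. The base model, adapter path, prompt, and expected substring below are all illustrative assumptions, not the test's actual fixtures:

```python
# Minimal sketch of an e2e LoRA accuracy check; the model name and
# adapter path are hypothetical stand-ins for the test fixtures.
from vllm import LLM, SamplingParams
from vllm.lora.request import LoRARequest

llm = LLM(
    model="meta-llama/Llama-3.2-1B-Instruct",  # assumed base model
    enable_lora=True,
    max_loras=1,
    max_lora_rank=8,
)

prompts = ["Write SQL listing the names of users older than 30."]
params = SamplingParams(temperature=0.0, max_tokens=64)

# lora_path is hypothetical; the real test downloads fixture weights.
outputs = llm.generate(
    prompts,
    params,
    lora_request=LoRARequest("sql_adapter", 1, "/path/to/lora"),
)

for out in outputs:
    text = out.outputs[0].text
    # Accuracy check: the adapted model should produce the expected span.
    assert "SELECT" in text, f"unexpected LoRA output: {text!r}"
```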

- vLLM version: v0.16.0
- vLLM main: 15d76f74e2
---------
Signed-off-by: paulyu12 <507435917@qq.com>
Signed-off-by: yupeng <507435917@qq.com>
yupeng · 2026-03-10 10:43:18 +08:00 · committed by GitHub
parent a398fa6a0b
commit 40f7d93f1a
2 changed files with 16 additions and 5 deletions


```diff
@@ -3,7 +3,6 @@
from unittest.mock import patch
import pytest
import vllm
import vllm.config
from vllm.lora.request import LoRARequest
@@ -126,7 +125,6 @@ def generate_and_test(llm, llama32_lora_files, tensorizer_config_dict: dict | None
print("removing lora")
@pytest.mark.skip(reason="fix me")
@patch.dict("os.environ", {"VLLM_USE_MODELSCOPE": "False"})
def test_llama_lora(llama32_lora_files):
    vllm_model = VllmRunner(
```
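
For context, the `generate_and_test` helper visible in the second hunk follows the usual e2e pattern of generating with a `LoRARequest` and comparing against fixed expected strings. A hedged sketch of that pattern, where the prompts, adapter name, and expected outputs are invented for illustration:

```python
# Hedged sketch of the expected-output comparison that helpers like
# generate_and_test perform; all concrete strings here are made up.
from vllm import LLM, SamplingParams
from vllm.lora.request import LoRARequest

EXPECTED = ["SELECT name FROM users WHERE age > 30"]  # illustrative only

def do_sample(llm: LLM, lora_path: str, lora_id: int) -> list[str]:
    prompts = ["Write SQL listing the names of users older than 30."]
    params = SamplingParams(temperature=0.0, max_tokens=64)
    outputs = llm.generate(
        prompts,
        params,
        # A non-None request routes generation through the adapter weights.
        lora_request=LoRARequest("sql_adapter", lora_id, lora_path),
    )
    return [o.outputs[0].text.strip() for o in outputs]

def check_lora_accuracy(llm: LLM, lora_path: str) -> None:
    for got, expected in zip(do_sample(llm, lora_path, lora_id=1), EXPECTED):
        # The regression fixed by this PR surfaced as a mismatch in
        # exactly this kind of substring comparison.
        assert expected in got, f"expected {expected!r} in {got!r}"
```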