[V1][LoRA][Test] V1 Engine LoRA support & e2e test (#893)

### What this PR does / why we need it? Add V1 Engine LoRA support. Add LoRA e2e tests on a single card and on multiple cards. ### Does this PR introduce _any_ user-facing change? Yes, LoRA is now supported on the V1 engine. ### How was this patch tested? CI passed with the newly added tests. --------- Signed-off-by: jesse <szxfml@gmail.com> Signed-off-by: paulyu <paulyu0307@gmail.com> Signed-off-by: paulyu12 <507435917@qq.com> Co-authored-by: jesse <szxfml@gmail.com> Co-authored-by: paulyu <paulyu0307@gmail.com>
2025-05-22 19:20:51 +08:00
parent 7aa4f85f10
commit 0f53b138f6
6 changed files with 167 additions and 38 deletions
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -23,6 +23,7 @@ from typing import List, Optional, Tuple, TypeVar, Union
 import numpy as np
 import pytest
 import torch
+from huggingface_hub import snapshot_download
 from PIL import Image
 from vllm import LLM, SamplingParams
 from vllm.config import TaskOption
@@ -348,4 +349,9 @@ def vllm_runner():

@pytest.fixture(params=list(PROMPT_TEMPLATES.keys()))
 def prompt_template(request):
-    return PROMPT_TEMPLATES[request.param]
+    return PROMPT_TEMPLATES[request.param]
+
+
+@pytest.fixture(scope="session")
+def ilama_lora_files():
+    return snapshot_download(repo_id="jeeejeee/ilama-text2sql-spider")