diff --git a/test/srt/lora/test_lora_update.py b/test/srt/lora/test_lora_update.py index 5024a9c5d..9afbde79c 100644 --- a/test/srt/lora/test_lora_update.py +++ b/test/srt/lora/test_lora_update.py @@ -229,6 +229,53 @@ BASIC_TESTS = [ ] ), ), + Operation( + type=OperationType.UNLOAD, + data="Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16", + ), + Operation( + type=OperationType.UNLOAD, + data="pbevan11/llama-3.1-8b-ocr-correction", + ), + Operation( + type=OperationType.FORWARD, + data=create_batch_data( + "Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16" + ), + expected_error="not loaded", + ), + Operation( + type=OperationType.FORWARD, + data=create_batch_data("pbevan11/llama-3.1-8b-ocr-correction"), + expected_error="not loaded", + ), + Operation( + type=OperationType.FORWARD, + data=create_batch_data(None), + ), + Operation( + type=OperationType.LOAD, + data="philschmid/code-llama-3-1-8b-text-to-sql-lora", + ), + Operation( + type=OperationType.LOAD, + data="Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16", + ), + Operation( + type=OperationType.LOAD, + data="pbevan11/llama-3.1-8b-ocr-correction", + ), + Operation( + type=OperationType.FORWARD, + data=create_batch_data( + [ + "philschmid/code-llama-3-1-8b-text-to-sql-lora", + "Nutanix/Meta-Llama-3.1-8B-Instruct_lora_4_alpha_16", + "pbevan11/llama-3.1-8b-ocr-correction", + None, + ] + ), + ), ], ), ] @@ -1194,7 +1241,7 @@ class TestLoRADynamicUpdate(CustomTestCase): """ Test dynamic LoRA updates in engine mode. """ - test_cases = ALL_TESTS + test_cases = BASIC_TESTS if is_in_ci() else ALL_TESTS self._run_dynamic_adapter_updates( mode=LoRAUpdateTestSessionMode.ENGINE, test_cases=test_cases, @@ -1204,9 +1251,7 @@ class TestLoRADynamicUpdate(CustomTestCase): """ Test dynamic LoRA updates in server mode. """ - # In CI, we only run the first test case to save time, as the engine test should be mostly sufficient for ensuring correctness. test_cases = BASIC_TESTS if is_in_ci() else ALL_TESTS - self._run_dynamic_adapter_updates( mode=LoRAUpdateTestSessionMode.SERVER, test_cases=test_cases ) diff --git a/test/srt/run_suite.py b/test/srt/run_suite.py index 0eab9537e..dab218994 100644 --- a/test/srt/run_suite.py +++ b/test/srt/run_suite.py @@ -21,7 +21,7 @@ suites = { TestFile("lora/test_lora_backend.py", 99), TestFile("lora/test_multi_lora_backend.py", 60), TestFile("lora/test_lora_cuda_graph.py", 250), - TestFile("lora/test_lora_update.py", 800), + TestFile("lora/test_lora_update.py", 400), TestFile("lora/test_lora_qwen3.py", 97), TestFile("models/test_embedding_models.py", 73), # TestFile("models/test_clip_models.py", 52),