[CI] Re-enable sleep mode test and skip failure breaking CI (#990)
### What this PR does / why we need it? - Re-enable sleep mode test - Fix nightly performance benchmark workflow - Fix model-runner-v1 bug for upstream [change](https://github.com/vllm-project/vllm/pull/18654) --------- Signed-off-by: wangli <wangli858794774@gmail.com>
This commit is contained in:
@@ -22,6 +22,7 @@ Run `pytest tests/test_offline_inference.py`.
|
||||
"""
|
||||
import os
|
||||
|
||||
import pytest
|
||||
import vllm # noqa: F401
|
||||
|
||||
from tests.conftest import VllmRunner
|
||||
@@ -46,6 +47,7 @@ def test_models_distributed_QwQ():
|
||||
vllm_model.generate_greedy(example_prompts, max_tokens)
|
||||
|
||||
|
||||
@pytest.mark.skipif(True, reason="wait for mla issue fixed on v1")
|
||||
def test_models_distributed_DeepSeek():
|
||||
example_prompts = [
|
||||
"vLLM is a high-throughput and memory-efficient inference and serving engine for LLMs.",
|
||||
|
||||
Reference in New Issue
Block a user