[Bugfix] Fix structured outputs errors: TypeError: apply_token_bitmask_inplace_cpu() (#6151)
### What this PR does / why we need it?
Fix https://github.com/vllm-project/vllm-ascend/issues/5524
- vLLM version: v0.13.0
- vLLM main:
d68209402d
Signed-off-by: wjunLu <wjunlu217@gmail.com>
This commit is contained in:
3
.github/workflows/_e2e_test.yaml
vendored
3
.github/workflows/_e2e_test.yaml
vendored
@@ -99,8 +99,7 @@ jobs:
|
|||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_camem.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_camem.py
|
||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_completion_with_prompt_embeds.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_completion_with_prompt_embeds.py
|
||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_cpu_offloading.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_cpu_offloading.py
|
||||||
# xgrammar has parameter mismatching bug, please follows: https://github.com/vllm-project/vllm-ascend/issues/5524
|
pytest -sv --durations=0 tests/e2e/singlecard/test_guided_decoding.py
|
||||||
# pytest -sv --durations=0 tests/e2e/singlecard/test_guided_decoding.py
|
|
||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_ilama_lora.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_ilama_lora.py
|
||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_llama32_lora.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_llama32_lora.py
|
||||||
pytest -sv --durations=0 tests/e2e/singlecard/test_qwen3_multi_loras.py
|
pytest -sv --durations=0 tests/e2e/singlecard/test_qwen3_multi_loras.py
|
||||||
|
|||||||
@@ -25,6 +25,7 @@ requires = [
|
|||||||
"msgpack",
|
"msgpack",
|
||||||
"quart",
|
"quart",
|
||||||
"numba",
|
"numba",
|
||||||
|
"xgrammar>=0.1.30",
|
||||||
"fastapi<0.124.0",
|
"fastapi<0.124.0",
|
||||||
"opencv-python-headless<=4.11.0.86", # Required to avoid numpy version conflict with vllm
|
"opencv-python-headless<=4.11.0.86", # Required to avoid numpy version conflict with vllm
|
||||||
"compressed_tensors>=0.11.0",
|
"compressed_tensors>=0.11.0",
|
||||||
|
|||||||
@@ -14,6 +14,7 @@ setuptools-scm>=8
|
|||||||
torch==2.9.0
|
torch==2.9.0
|
||||||
torchvision
|
torchvision
|
||||||
wheel
|
wheel
|
||||||
|
xgrammar>=0.1.30
|
||||||
pandas-stubs
|
pandas-stubs
|
||||||
opencv-python-headless<=4.11.0.86 # Required to avoid numpy version conflict with vllm
|
opencv-python-headless<=4.11.0.86 # Required to avoid numpy version conflict with vllm
|
||||||
compressed_tensors>=0.11.0
|
compressed_tensors>=0.11.0
|
||||||
|
|||||||
Reference in New Issue
Block a user