### What this PR does / why we need it? - Upgrade to v0.10.0 - Drop v0.9.2 version compatibility - Add patch for `vllm_ascend/patch/worker/patch_common/patch_sampler_gather_logprobs.py` as workaround of f3a683b7c9 for v0.10.0 and also add e2e test `test_models_prompt_logprobs` - Pin transformers<4.54.0 as workaround of https://github.com/vllm-project/vllm-ascend/issues/2034 ### Does this PR introduce _any_ user-facing change? No ### How was this patch tested? - Test locally: `VLLM_USE_MODELSCOPE=true pytest -sv tests/e2e/singlecard/test_offline_inference.py::test_models_prompt_logprobs` - CI passed - vLLM version: v0.9.2 - vLLM main: 7728dd77bb --------- Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
37 lines
982 B
TOML
37 lines
982 B
TOML
[build-system]
# Packages that must be installed in the build environment before the
# backend below is invoked.
# Should be mirrored in requirements.txt
requires = [
    "cmake>=3.26",
    "decorator",
    "einops",
    "numpy<2.0.0",
    "packaging",
    "pip",
    "pybind11",
    "pyyaml",
    "scipy",
    "setuptools>=64",
    "setuptools-scm>=8",
    "torch-npu==2.5.1.post1.dev20250619",
    "torch>=2.5.1",
    "torchvision<0.21.0",
    "wheel",
    "msgpack",
    "quart",
    "numba",
    # Temporary upper bound on transformers.
    # Remove after https://github.com/vllm-project/vllm-ascend/issues/2034
    "transformers<4.54.0",
]
build-backend = "setuptools.build_meta"

# Markdown lint rule settings; the trailing comment on each line gives the
# human-readable name of the rule being configured.
[tool.pymarkdown]
plugins.md004.style = "sublist" # ul-style
plugins.md007.indent = 4 # ul-indent
plugins.md007.start_indented = true # ul-indent
plugins.md013.enabled = false # line-length
plugins.md041.enabled = false # first-line-h1
plugins.md033.enabled = false # inline-html
plugins.md046.enabled = false # code-block-style
plugins.md024.allow_different_nesting = true # no-duplicate-headers
plugins.md029.enabled = false # ol-prefix