### What this PR does / why we need it?
Add support for V1 Engine.
Please note that this is just the initial version, and there may be some
places need to be fixed or optimized in the future, feel free to leave
some comments to us.
### Does this PR introduce _any_ user-facing change?
To use V1 Engine on NPU device, you need to set the env variable shown
below:
```bash
export VLLM_USE_V1=1
export VLLM_WORKER_MULTIPROC_METHOD=spawn
```
If you are using vllm for offline inferencing, you must add a `__main__`
guard like:
```bash
if __name__ == '__main__':
llm = vllm.LLM(...)
```
Find more details
[here](https://docs.vllm.ai/en/latest/getting_started/troubleshooting.html#python-multiprocessing).
### How was this patch tested?
I have tested the online serving with `Qwen2.5-7B-Instruct` using this
command:
```bash
vllm serve Qwen/Qwen2.5-7B-Instruct --max_model_len 26240
```
Query the model with input prompts:
```bash
curl http://localhost:8000/v1/completions \
-H "Content-Type: application/json" \
-d '{
"model": "Qwen/Qwen2.5-7B-Instruct",
"prompt": "The future of AI is",
"max_tokens": 7,
"temperature": 0
}'
```
---------
Signed-off-by: shen-shanshan <467638484@qq.com>
Co-authored-by: didongli182 <didongli@huawei.com>
346 lines
11 KiB
Bash
Executable File
346 lines
11 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
|
|
#
|
|
# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
|
|
# This file is a part of the vllm-ascend project.
|
|
# Adapted from https://github.com/vllm-project/vllm/tree/main/tools
|
|
# Copyright 2023 The vLLM team.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
#
|
|
|
|
# YAPF formatter, adapted from ray and skypilot.
|
|
#
|
|
# Usage:
|
|
# # Do work and commit your work.
|
|
|
|
# # Format files that differ from origin/main.
|
|
# bash format.sh
|
|
|
|
# # Commit changed files with message 'Run yapf and ruff'
|
|
#
|
|
#
|
|
# YAPF + Clang formatter (if installed). This script formats all changed files from the last mergebase.
|
|
# You are encouraged to run this locally before pushing changes for review.
|
|
|
|
# Cause the script to exit if a single command fails
|
|
set -eo pipefail
|
|
|
|
# this stops git rev-parse from failing if we run this from the .git directory
|
|
builtin cd "$(dirname "${BASH_SOURCE:-$0}")"
|
|
ROOT="$(git rev-parse --show-toplevel)"
|
|
builtin cd "$ROOT" || exit 1
|
|
|
|
check_command() {
|
|
if ! command -v "$1" &> /dev/null; then
|
|
echo "❓❓$1 is not installed, please run \`pip install -r requirements-lint.txt\`"
|
|
exit 1
|
|
fi
|
|
}
|
|
|
|
check_command yapf
|
|
check_command ruff
|
|
check_command mypy
|
|
check_command codespell
|
|
check_command isort
|
|
check_command clang-format
|
|
|
|
YAPF_VERSION=$(yapf --version | awk '{print $2}')
|
|
RUFF_VERSION=$(ruff --version | awk '{print $2}')
|
|
MYPY_VERSION=$(mypy --version | awk '{print $2}')
|
|
CODESPELL_VERSION=$(codespell --version)
|
|
ISORT_VERSION=$(isort --vn)
|
|
CLANGFORMAT_VERSION=$(clang-format --version | awk '{print $3}')
|
|
SPHINX_LINT_VERSION=$(sphinx-lint --version | awk '{print $2}')
|
|
|
|
# params: tool name, tool version, required version
|
|
tool_version_check() {
|
|
expected=$(grep "$1" requirements-lint.txt | cut -d'=' -f3)
|
|
if [[ "$2" != "$expected" ]]; then
|
|
echo "❓❓Wrong $1 version installed: $expected is required, not $2."
|
|
exit 1
|
|
fi
|
|
}
|
|
|
|
tool_version_check "yapf" "$YAPF_VERSION"
|
|
tool_version_check "ruff" "$RUFF_VERSION"
|
|
tool_version_check "mypy" "$MYPY_VERSION"
|
|
tool_version_check "isort" "$ISORT_VERSION"
|
|
tool_version_check "codespell" "$CODESPELL_VERSION"
|
|
tool_version_check "clang-format" "$CLANGFORMAT_VERSION"
|
|
tool_version_check "sphinx-lint" "$SPHINX_LINT_VERSION"
|
|
|
|
YAPF_FLAGS=(
|
|
'--recursive'
|
|
'--parallel'
|
|
)
|
|
|
|
YAPF_EXCLUDES=(
|
|
'--exclude' 'build/**'
|
|
)
|
|
|
|
# Format specified files
|
|
format() {
|
|
yapf --in-place "${YAPF_FLAGS[@]}" "$@"
|
|
}
|
|
|
|
# Format files that differ from main branch. Ignores dirs that are not slated
|
|
# for autoformat yet.
|
|
format_changed() {
|
|
# The `if` guard ensures that the list of filenames is not empty, which
|
|
# could cause yapf to receive 0 positional arguments, making it hang
|
|
# waiting for STDIN.
|
|
#
|
|
# `diff-filter=ACM` and $MERGEBASE is to ensure we only format files that
|
|
# exist on both branches.
|
|
MERGEBASE="$(git merge-base origin/main HEAD)"
|
|
|
|
if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
|
|
git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs -P 5 \
|
|
yapf --in-place "${YAPF_EXCLUDES[@]}" "${YAPF_FLAGS[@]}"
|
|
fi
|
|
}
|
|
|
|
# Format all files
|
|
format_all() {
|
|
yapf --in-place "${YAPF_FLAGS[@]}" "${YAPF_EXCLUDES[@]}" .
|
|
}
|
|
|
|
## This flag formats individual files. --files *must* be the first command line
|
|
## arg to use this option.
|
|
if [[ "$1" == '--files' ]]; then
|
|
format "${@:2}"
|
|
# If `--all` is passed, then any further arguments are ignored and the
|
|
# entire python directory is formatted.
|
|
elif [[ "$1" == '--all' ]]; then
|
|
format_all
|
|
else
|
|
# Format only the files that changed in last commit.
|
|
format_changed
|
|
fi
|
|
echo 'vLLM yapf: Done'
|
|
|
|
# Run mypy
|
|
echo 'vLLM mypy:'
|
|
tools/mypy.sh
|
|
echo 'vLLM mypy: Done'
|
|
|
|
|
|
# If git diff returns a file that is in the skip list, the file may be checked anyway:
|
|
# https://github.com/codespell-project/codespell/issues/1915
|
|
# Avoiding the "./" prefix and using "/**" globs for directories appears to solve the problem
|
|
CODESPELL_EXCLUDES=(
|
|
'--skip' 'tests/prompts/**,./benchmarks/sonnet.txt,*tests/lora/data/**,build/**'
|
|
)
|
|
|
|
CODESPELL_IGNORE_WORDS=(
|
|
'-L' 'CANN,cann,NNAL,nnal,ASCEND,ascend'
|
|
)
|
|
|
|
# check spelling of specified files
|
|
spell_check() {
|
|
codespell "$@" "${CODESPELL_IGNORE_WORDS[@]}"
|
|
}
|
|
|
|
spell_check_all() {
|
|
codespell --toml pyproject.toml "${CODESPELL_EXCLUDES[@]}" "${CODESPELL_IGNORE_WORDS[@]}"
|
|
}
|
|
|
|
# Spelling check of files that differ from main branch.
|
|
spell_check_changed() {
|
|
# The `if` guard ensures that the list of filenames is not empty, which
|
|
# could cause ruff to receive 0 positional arguments, making it hang
|
|
# waiting for STDIN.
|
|
#
|
|
# `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
|
|
# exist on both branches.
|
|
MERGEBASE="$(git merge-base origin/main HEAD)"
|
|
if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
|
|
git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
|
|
codespell "${CODESPELL_EXCLUDES[@]}" "${CODESPELL_IGNORE_WORDS[@]}"
|
|
codespell "${CODESPELL_EXCLUDES[@]}" "${CODESPELL_IGNORE_WORDS[@]}"
|
|
fi
|
|
}
|
|
|
|
# Run Codespell
|
|
## This flag runs spell check of individual files. --files *must* be the first command line
|
|
## arg to use this option.
|
|
if [[ "$1" == '--files' ]]; then
|
|
spell_check "${@:2}"
|
|
# If `--all` is passed, then any further arguments are ignored and the
|
|
# entire python directory is linted.
|
|
elif [[ "$1" == '--all' ]]; then
|
|
spell_check_all
|
|
else
|
|
# Check spelling only of the files that changed in last commit.
|
|
spell_check_changed
|
|
fi
|
|
echo 'vLLM codespell: Done'
|
|
|
|
|
|
# Lint specified files
|
|
lint() {
|
|
ruff check "$@"
|
|
}
|
|
|
|
# Lint files that differ from main branch. Ignores dirs that are not slated
|
|
# for autolint yet.
|
|
lint_changed() {
|
|
# The `if` guard ensures that the list of filenames is not empty, which
|
|
# could cause ruff to receive 0 positional arguments, making it hang
|
|
# waiting for STDIN.
|
|
#
|
|
# `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
|
|
# exist on both branches.
|
|
MERGEBASE="$(git merge-base origin/main HEAD)"
|
|
|
|
if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
|
|
git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
|
|
ruff check
|
|
fi
|
|
|
|
}
|
|
|
|
# Run Ruff
|
|
### This flag lints individual files. --files *must* be the first command line
|
|
### arg to use this option.
|
|
if [[ "$1" == '--files' ]]; then
|
|
lint "${@:2}"
|
|
# If `--all` is passed, then any further arguments are ignored and the
|
|
# entire python directory is linted.
|
|
elif [[ "$1" == '--all' ]]; then
|
|
lint vllm tests
|
|
else
|
|
# Format only the files that changed in last commit.
|
|
lint_changed
|
|
fi
|
|
echo 'vLLM ruff: Done'
|
|
|
|
# check spelling of specified files
|
|
isort_check() {
|
|
isort "$@"
|
|
}
|
|
|
|
isort_check_all(){
|
|
isort .
|
|
}
|
|
|
|
# Spelling check of files that differ from main branch.
|
|
isort_check_changed() {
|
|
# The `if` guard ensures that the list of filenames is not empty, which
|
|
# could cause ruff to receive 0 positional arguments, making it hang
|
|
# waiting for STDIN.
|
|
#
|
|
# `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
|
|
# exist on both branches.
|
|
MERGEBASE="$(git merge-base origin/main HEAD)"
|
|
|
|
if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
|
|
git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
|
|
isort
|
|
fi
|
|
}
|
|
|
|
# Run Isort
|
|
# This flag runs spell check of individual files. --files *must* be the first command line
|
|
# arg to use this option.
|
|
if [[ "$1" == '--files' ]]; then
|
|
isort_check "${@:2}"
|
|
# If `--all` is passed, then any further arguments are ignored and the
|
|
# entire python directory is linted.
|
|
elif [[ "$1" == '--all' ]]; then
|
|
isort_check_all
|
|
else
|
|
# Check spelling only of the files that changed in last commit.
|
|
isort_check_changed
|
|
fi
|
|
echo 'vLLM isort: Done'
|
|
|
|
# Clang-format section
|
|
# Exclude some files for formatting because they are vendored
|
|
# NOTE: Keep up to date with .github/workflows/clang-format.yml
|
|
CLANG_FORMAT_EXCLUDES=(
|
|
'csrc/moe/topk_softmax_kernels.cu'
|
|
'csrc/quantization/gguf/ggml-common.h'
|
|
'csrc/quantization/gguf/dequantize.cuh'
|
|
'csrc/quantization/gguf/vecdotq.cuh'
|
|
'csrc/quantization/gguf/mmq.cuh'
|
|
'csrc/quantization/gguf/mmvq.cuh'
|
|
)
|
|
|
|
# Format specified files with clang-format
|
|
clang_format() {
|
|
clang-format -i "$@"
|
|
}
|
|
|
|
# Format files that differ from main branch with clang-format.
|
|
clang_format_changed() {
|
|
# The `if` guard ensures that the list of filenames is not empty, which
|
|
# could cause clang-format to receive 0 positional arguments, making it hang
|
|
# waiting for STDIN.
|
|
#
|
|
# `diff-filter=ACM` and $MERGEBASE is to ensure we only format files that
|
|
# exist on both branches.
|
|
MERGEBASE="$(git merge-base origin/main HEAD)"
|
|
|
|
# Get the list of changed files, excluding the specified ones
|
|
changed_files=$(git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.h' '*.cpp' '*.cu' '*.cuh' | (grep -vFf <(printf "%s\n" "${CLANG_FORMAT_EXCLUDES[@]}") || echo -e))
|
|
if [ -n "$changed_files" ]; then
|
|
echo "$changed_files" | xargs -P 5 clang-format -i
|
|
fi
|
|
}
|
|
|
|
# Format all files with clang-format
|
|
clang_format_all() {
|
|
find csrc/ \( -name '*.h' -o -name '*.cpp' -o -name '*.cu' -o -name '*.cuh' \) -print \
|
|
| grep -vFf <(printf "%s\n" "${CLANG_FORMAT_EXCLUDES[@]}") \
|
|
| xargs clang-format -i
|
|
}
|
|
|
|
# Run clang-format
|
|
if [[ "$1" == '--files' ]]; then
|
|
clang_format "${@:2}"
|
|
elif [[ "$1" == '--all' ]]; then
|
|
clang_format_all
|
|
else
|
|
clang_format_changed
|
|
fi
|
|
echo 'vLLM clang-format: Done'
|
|
|
|
echo 'vLLM actionlint:'
|
|
tools/actionlint.sh -color
|
|
echo 'vLLM actionlint: Done'
|
|
|
|
echo 'vLLM shellcheck:'
|
|
tools/shellcheck.sh
|
|
echo 'vLLM shellcheck: Done'
|
|
|
|
echo 'excalidraw png check:'
|
|
tools/png-lint.sh
|
|
echo 'excalidraw png check: Done'
|
|
|
|
if ! git diff --quiet &>/dev/null; then
|
|
echo
|
|
echo "🔍🔍There are files changed by the format checker or by you that are not added and committed:"
|
|
git --no-pager diff --name-only
|
|
echo "🔍🔍Format checker passed, but please add, commit and push all the files above to include changes made by the format checker."
|
|
|
|
exit 1
|
|
else
|
|
echo "✨🎉 Format check passed! Congratulations! 🎉✨"
|
|
fi
|
|
|
|
# echo 'vLLM sphinx-lint:'
|
|
# tools/sphinx-lint.sh
|
|
# echo 'vLLM sphinx-lint: Done'
|