From 91f7d8115dd3bab76974e22cbd3df13cacb9f8f3 Mon Sep 17 00:00:00 2001 From: Mengqing Cao Date: Fri, 7 Mar 2025 20:34:07 +0800 Subject: [PATCH] [CI/Build] Bump torch_npu to dev20250307.3 (#265) Update torch-npu version to fix torch npu exponential_ accuracy. With this update, the precision issue when setting `temperature > 0` is fixed. --------- Signed-off-by: Mengqing Cao --- .github/workflows/vllm_ascend_test.yaml | 4 ++-- README.md | 2 +- README.zh.md | 2 +- docs/source/installation.md | 12 ++++++------ docs/source/tutorials.md | 6 ++++-- pta_install.sh | 6 +++--- 6 files changed, 17 insertions(+), 15 deletions(-) diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index ea3d673..7b1d773 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -133,9 +133,9 @@ jobs: run: | mkdir pta cd pta - wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py310.tar.gz + wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py310.tar.gz tar -xvf pytorch_v2.5.1_py310.tar.gz - pip install ./torch_npu-2.5.1.dev20250226-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl + pip install ./torch_npu-2.5.1.dev20250307-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl cd .. rm -rf pta diff --git a/README.md b/README.md index 16e7401..fa93fa8 100644 --- a/README.md +++ b/README.md @@ -36,7 +36,7 @@ By using vLLM Ascend plugin, popular open-source models, including Transformer-l - Software: * Python >= 3.9 * CANN >= 8.0.0 - * PyTorch >= 2.5.1, torch-npu >= 2.5.1.dev20250226 + * PyTorch >= 2.5.1, torch-npu >= 2.5.1.dev20250307 * vLLM (the same version as vllm-ascend) Find more about how to setup your environment step by step in [here](docs/source/installation.md). 
diff --git a/README.zh.md b/README.zh.md index 669f629..a4f3beb 100644 --- a/README.zh.md +++ b/README.zh.md @@ -36,7 +36,7 @@ vLLM 昇腾插件 (`vllm-ascend`) 是一个让vLLM在Ascend NPU无缝运行的 - 软件: * Python >= 3.9 * CANN >= 8.0.RC2 - * PyTorch >= 2.5.1, torch-npu >= 2.5.1.dev20250226 + * PyTorch >= 2.5.1, torch-npu >= 2.5.1.dev20250307 * vLLM (与vllm-ascend版本一致) 在[此处](docs/source/installation.md),您可以了解如何逐步准备环境。 diff --git a/docs/source/installation.md b/docs/source/installation.md index 78c54be..beb8efc 100644 --- a/docs/source/installation.md +++ b/docs/source/installation.md @@ -12,7 +12,7 @@ This document describes how to install vllm-ascend manually. | Software | Supported version | Note | | ------------ | ----------------- | ---- | | CANN | >= 8.0.0 | Required for vllm-ascend and torch-npu | - | torch-npu | >= 2.5.1.dev20250226 | Required for vllm-ascend | + | torch-npu | >= 2.5.1.dev20250307 | Required for vllm-ascend | | torch | >= 2.5.1 | Required for torch-npu and vllm | You have 2 way to install: @@ -150,15 +150,15 @@ Current version depends on a unreleased `torch-npu`, you need to install manuall # # Here we take python 3.10 on aarch64 as an example. Feel free to install the correct version for your environment. 
See: # -# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py39.tar.gz -# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py310.tar.gz -# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py311.tar.gz +# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py39.tar.gz +# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py310.tar.gz +# https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py311.tar.gz # mkdir pta cd pta -wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py310.tar.gz +wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py310.tar.gz tar -xvf pytorch_v2.5.1_py310.tar.gz -pip install ./torch_npu-2.5.1.dev20250226-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl +pip install ./torch_npu-2.5.1.dev20250307-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl ``` :::: diff --git a/docs/source/tutorials.md b/docs/source/tutorials.md index 08a07bd..a81e038 100644 --- a/docs/source/tutorials.md +++ b/docs/source/tutorials.md @@ -212,7 +212,9 @@ Prompt: 'The future of AI is', Generated text: ' following you. 
As the technolog Run docker container on each machine: -```shell +```{code-block} bash + :substitutions: + docker run \ --name vllm-ascend \ --device /dev/davinci0 \ @@ -233,7 +235,7 @@ docker run \ -v /etc/ascend_install.info:/etc/ascend_install.info \ -v /root/.cache:/root/.cache \ -p 8000:8000 \ --it quay.io/ascend/vllm-ascend:v0.7.1rc1 bash +-it quay.io/ascend/vllm-ascend:|vllm_ascend_version| bash ``` Choose one machine as head node, the other are worker nodes, then start ray on each machine: diff --git a/pta_install.sh b/pta_install.sh index 8ca7db0..afb6da0 100755 --- a/pta_install.sh +++ b/pta_install.sh @@ -2,14 +2,14 @@ set -ex mkdir pta cd pta || exit -wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250226.4/pytorch_v2.5.1_py310.tar.gz +wget https://pytorch-package.obs.cn-north-4.myhuaweicloud.com/pta/Daily/v2.5.1/20250307.3/pytorch_v2.5.1_py310.tar.gz tar -zxvf pytorch_v2.5.1_py310.tar.gz if [ "$(uname -i)" == "aarch64" ] then - pip install ./torch_npu-2.5.1.dev20250226-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl + pip install ./torch_npu-2.5.1.dev20250307-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl else - pip install ./torch_npu-2.5.1.dev20250226-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl --extra-index https://download.pytorch.org/whl/cpu/ + pip install ./torch_npu-2.5.1.dev20250307-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl --extra-index https://download.pytorch.org/whl/cpu/ fi cd ..