[bugs] Fix the FIA install shell scripts (#6989)

### What this PR does / why we need it?
Update the shell scripts that replace the FIA (fused_infer_attention_score)
operator files for the FD feature so that they target CANN 8.5.1.

- vLLM version: v0.16.0
- vLLM main: 15d76f74e2
---------
Signed-off-by: zjks98 <zhangjiakang4@huawei.com>
Signed-off-by: aipaes <82140963+aipaes@users.noreply.github.com>
Co-authored-by: zjks98 <zhangjiakang4@huawei.com>
This commit is contained in:
aipaes
2026-03-06 11:42:32 +08:00
committed by GitHub
parent 16c3b0b822
commit 620076b76a
2 changed files with 12 additions and 8 deletions

View File

@@ -22,16 +22,18 @@ set -euo pipefail
# NOTE(review): this excerpt appears to be a rendered diff hunk in which the
# pre-change and post-change versions of several commands are shown back to
# back without +/- markers. Confirm against the real script before running it.

# On any failing command, print the line number, the command text and its
# exit code to stderr.
trap 'echo "Error on line $LINENO: command \`$BASH_COMMAND\` failed with exit code $?" >&2' ERR
# The archive is downloaded and unpacked under /vllm-workspace.
cd /vllm-workspace
# Create the directory the archive is extracted into below; its name is
# suffixed with the output of `uname -i`.
# NOTE(review): presumably `uname -i` yields the CPU architecture (e.g.
# x86_64 / aarch64) on the target images — confirm it never prints "unknown".
mkdir -p fused_infer_attention_score_a2_$(uname -i)
# download fused_infer_attention_score related source files
# NOTE(review): the next two lines (cann-8.5.0 URL, tar without -C) look like
# the superseded versions of the two lines that follow them — confirm.
wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/cann-8.5.0/fused_infer_attention_score_a2_$(uname -i).tar.gz
tar -zxvf ./fused_infer_attention_score_a2_$(uname -i).tar.gz
# Fetch the cann-8.5.1 archive and unpack it into the directory created above.
wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/cann-8.5.1/fused_infer_attention_score_a2_$(uname -i).tar.gz
tar -zxvf ./fused_infer_attention_score_a2_$(uname -i).tar.gz -C ./fused_infer_attention_score_a2_$(uname -i)
# replace fused_infer_attention_score operation files
# NOTE(review): the first cd (.../ascend910b) looks like the superseded form of
# the second one (.../ascend910b/ops_transformer) — confirm. Both paths are
# rooted at $ASCEND_TOOLKIT_HOME, which must be set because the script runs
# with `set -u`.
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/kernel/ascend910b
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/kernel/ascend910b/ops_transformer
# Drop the existing kernel directory, then copy in the one from the
# extracted archive.
rm -rf fused_infer_attention_score
cp -r /vllm-workspace/fused_infer_attention_score_a2_$(uname -i)/fused_infer_attention_score .
# replace related so
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/$(uname -i)
# NOTE(review): the first rm (three explicit file names) looks like the
# superseded form of the two rm commands after it — confirm. If all three ran
# in sequence, the later ones would find nothing left to delete and, without
# -f, would fail.
rm libopmaster_ct.so libopmaster_rt2.0.so liboptiling.so
# Remove every libopmaster_*.so and liboptiling.so from the tiling lib
# directory before copying the replacements.
rm libopmaster_*.so
rm liboptiling.so
# Copy every .so from the top level of the extracted archive directory into
# the current (op_tiling lib) directory.
cp /vllm-workspace/fused_infer_attention_score_a2_$(uname -i)/*.so .

View File

@@ -21,16 +21,18 @@ set -euo pipefail
# NOTE(review): this excerpt appears to be a rendered diff hunk in which the
# pre-change and post-change versions of several commands are shown back to
# back without +/- markers. Confirm against the real script before running it.

# On any failing command, print the line number, the command text and its
# exit code to stderr.
trap 'echo "Error on line $LINENO: command \`$BASH_COMMAND\` failed with exit code $?" >&2' ERR
# The archive is downloaded and unpacked under /vllm-workspace.
cd /vllm-workspace
# Create the directory the archive is extracted into below; its name is
# suffixed with the output of `uname -i`.
# NOTE(review): presumably `uname -i` yields the CPU architecture (e.g.
# x86_64 / aarch64) on the target images — confirm it never prints "unknown".
mkdir -p fused_infer_attention_score_a3_$(uname -i)
# download fused_infer_attention_score related source files
# NOTE(review): the next two lines (cann-8.5.0 URL, tar without -C) look like
# the superseded versions of the two lines that follow them — confirm.
wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/cann-8.5.0/fused_infer_attention_score_a3_$(uname -i).tar.gz
tar -zxvf ./fused_infer_attention_score_a3_$(uname -i).tar.gz
# Fetch the cann-8.5.1 archive and unpack it into the directory created above.
wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/cann-8.5.1/fused_infer_attention_score_a3_$(uname -i).tar.gz
tar -zxvf ./fused_infer_attention_score_a3_$(uname -i).tar.gz -C ./fused_infer_attention_score_a3_$(uname -i)
# replace fused_infer_attention_score operation files
# NOTE(review): the first cd (.../ascend910_93) looks like the superseded form
# of the second one (.../ascend910_93/ops_transformer) — confirm. Both paths
# are rooted at $ASCEND_TOOLKIT_HOME, which must be set because the script
# runs with `set -u`.
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/kernel/ascend910_93
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/kernel/ascend910_93/ops_transformer
# Drop the existing kernel directory, then copy in the one from the
# extracted archive.
rm -rf fused_infer_attention_score
cp -r /vllm-workspace/fused_infer_attention_score_a3_$(uname -i)/fused_infer_attention_score .
# replace related so
cd $ASCEND_TOOLKIT_HOME/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/$(uname -i)
# NOTE(review): the first rm (three explicit file names) looks like the
# superseded form of the two rm commands after it — confirm. If all three ran
# in sequence, the later ones would find nothing left to delete and, without
# -f, would fail.
rm libopmaster_ct.so libopmaster_rt2.0.so liboptiling.so
# Remove every libopmaster_*.so and liboptiling.so from the tiling lib
# directory before copying the replacements.
rm libopmaster_*.so
rm liboptiling.so
# Copy every .so from the top level of the extracted archive directory into
# the current (op_tiling lib) directory.
cp /vllm-workspace/fused_infer_attention_score_a3_$(uname -i)/*.so .