Files
xc-llm-ascend/csrc/cmake/scripts/prepare.sh
Chenxi Qian 554f16ae1f [Kernel] add custom op GmmSwigluQuantWeightNzTensorList (#3804)
### What this PR does / why we need it?

This PR introduces support for adding custom CANN `aclnn` ops to
`vllm-ascend`, allowing users to define and use their own custom
operators.

Key changes include:
- Building and installing custom ops into the `vllm-ascend`-specified
directory
- Binding the `aclnn` op interface to the `torch.ops._C_ascend` module
- Enabling invocation of these ops within `vllm-ascend`

This PR includes a sample custom op:
`aclnnGroupedMatmulSwigluQuantWeightNzTensorList`, which is adapted from
the CANN operator
[`aclnnGroupedMatmulSwigluQuantWeightNZ`](https://www.hiascend.com/document/detail/zh/canncommercial/83RC1/API/aolapi/context/aclnnGroupedMatmulSwigluQuantWeightNZ.md).
Its input parameters `weight` and `weight_scale` now accept
`list[torch.Tensor]` (i.e., `at::TensorList`).

### Does this PR introduce _any_ user-facing change?

No.


- vLLM version: v0.11.2

---------

Signed-off-by: QianChenxi <chenxi.qian.cq@outlook.com>
2025-11-28 18:06:39 +08:00

131 lines
3.4 KiB
Bash

#!/bin/bash
# Copyright (c) 2024 Huawei Technologies Co., Ltd.
# This file is a part of the CANN Open Software.
# Licensed under CANN Open Software License Agreement Version 1.0 (the "License").
# Please refer to the License for details. You may not use this file except in compliance with the License.
# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
# INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
# See LICENSE in the root of the software repository for the full text of the License.
# ======================================================================================================================
CPU_NUM=$(($(cat /proc/cpuinfo | grep "^processor" | wc -l)*2))
JOB_NUM="-j${CPU_NUM}"
while [[ $# -gt 0 ]]; do
case $1 in
-s)
PATH_TO_SOURCE="$2"
shift 2
;;
-b)
PATH_TO_BUILD="$2"
shift 2
;;
-p)
ASCEND_CANN_PACKAGE_PATH="$2"
shift 2
;;
--autogen-dir)
ASCEND_AUTOGEN_DIR="$2"
shift 2
;;
--build-open-project)
BUILD_OPEN_PROJECT="$2"
shift 2
;;
--binary-out-dir)
ASCEND_BINARY_OUT_DIR="$2"
shift 2
;;
--impl-out-dir)
ASCEND_IMPL_OUT_DIR="$2"
shift 2
;;
--op-build-tool)
OP_BUILD_TOOL="$2"
shift 2
;;
--ascend-cmake-dir)
ASCEND_CMAKE_DIR="$2"
shift 2
;;
--tiling-key)
TILING_KEY="$2"
shift 2
;;
--ops-compile-options)
OPS_COMPILE_OPTIONS="$2"
shift 2
;;
--check-compatible)
CHECK_COMPATIBLE="$2"
shift 2
;;
--ascend-compute_unit)
ASCEND_COMPUTE_UNIT="$2"
shift 2
;;
--ascend-op-name)
ASCEND_OP_NAME="$2"
shift 2
;;
--op_debug_config)
OP_DEBUG_CONFIG="$2"
shift 2
;;
*)
break
;;
esac
done
function clean() {
if [ -n "${PATH_TO_BUILD}" ];then
rm -rf ${PATH_TO_BUILD}
mkdir -p ${PATH_TO_BUILD}
fi
}
function convert_string() {
local _input=$1
_output=$(echo $_input | sed 's/::/;/g')
echo "${_output}"
}
function set_env() {
CONVERT_TILING_KEY="$(convert_string ${TILING_KEY})"
CONVERT_OPS_COMPILE_OPTIONS="$(convert_string ${OPS_COMPILE_OPTIONS})"
CONVERT_ASCEND_COMPUTE_UNIT="$(convert_string ${ASCEND_COMPUTE_UNIT})"
}
function build() {
cd ${PATH_TO_BUILD}
cmake ${PATH_TO_SOURCE} \
-DBUILD_OPEN_PROJECT=${BUILD_OPEN_PROJECT} \
-DPREPARE_BUILD=ON \
-DCUSTOM_ASCEND_CANN_PACKAGE_PATH=${ASCEND_CANN_PACKAGE_PATH} \
-DASCEND_AUTOGEN_DIR=${ASCEND_AUTOGEN_DIR} \
-DASCEND_BINARY_OUT_DIR=${ASCEND_BINARY_OUT_DIR} \
-DASCEND_IMPL_OUT_DIR=${ASCEND_IMPL_OUT_DIR} \
-DOP_BUILD_TOOL=${OP_BUILD_TOOL} \
-DASCEND_CMAKE_DIR=${ASCEND_CMAKE_DIR} \
-DCHECK_COMPATIBLE=${CHECK_COMPATIBLE} \
-DTILING_KEY="${CONVERT_TILING_KEY}" \
-DOPS_COMPILE_OPTIONS="${CONVERT_OPS_COMPILE_OPTIONS}" \
-DASCEND_COMPUTE_UNIT=${CONVERT_ASCEND_COMPUTE_UNIT} \
-DOP_DEBUG_CONFIG=${OP_DEBUG_CONFIG} \
-DASCEND_OP_NAME=${ASCEND_OP_NAME}
make ${JOB_NUM} prepare_build
}
function main() {
clean
set_env
build
}
main