### What this PR does / why we need it? This PR introduces support for adding custom CANN `aclnn` ops to `vllm-ascend`, allowing users to define and use their own custom operators. Key changes include: - Building and installing custom ops into the `vllm-ascend`-specified directory - Binding the `aclnn` op interface to the `torch.ops._C_ascend` module - Enabling invocation of these ops within `vllm-ascend` This PR includes a sample custom op: `aclnnGroupedMatmulSwigluQuantWeightNzTensorList`, which is adapted from the CANN operator [`aclnnGroupedMatmulSwigluQuantWeightNZ`](https://www.hiascend.com/document/detail/zh/canncommercial/83RC1/API/aolapi/context/aclnnGroupedMatmulSwigluQuantWeightNZ.md). Its input parameters `weight` and `weight_scale` now accept `list[torch.Tensor]` (i.e., `at::TensorList`). ### Does this PR introduce _any_ user-facing change? No. - vLLM version: v0.11.2 --------- Signed-off-by: QianChenxi <chenxi.qian.cq@outlook.com>
76 lines
3.6 KiB
CMake
76 lines
3.6 KiB
CMake
# Copyright (c) 2024 Huawei Technologies Co., Ltd.
|
|
# This file is a part of the CANN Open Software.
|
|
# Licensed under CANN Open Software License Agreement Version 1.0 (the "License").
|
|
# Please refer to the License for details. You may not use this file except in compliance with the License.
|
|
# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
|
|
# INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
|
|
# See LICENSE in the root of the software repository for the full text of the License.
|
|
# ======================================================================================================================
|
|
|
|
# Custom package scenario, public compilation configuration for Host side targets
|
|
# Note: To ensure compatibility with the built-in package compilation process, the intf_pub name cannot be changed
|
|
add_library(intf_pub INTERFACE)
|
|
target_include_directories(intf_pub
|
|
INTERFACE
|
|
${ASCEND_CANN_PACKAGE_PATH}/include
|
|
${ASCEND_CANN_PACKAGE_PATH}/include/external
|
|
${ASCEND_CANN_PACKAGE_PATH}/include/experiment/platform
|
|
${ASCEND_CANN_PACKAGE_PATH}/include/experiment/runtime
|
|
${ASCEND_CANN_PACKAGE_PATH}/include/experiment/msprof
|
|
)
|
|
target_link_directories(intf_pub
|
|
INTERFACE
|
|
${ASCEND_CANN_PACKAGE_PATH}/lib64
|
|
)
|
|
target_compile_options(intf_pub
|
|
INTERFACE
|
|
-fPIC
|
|
-O2
|
|
-Wall -Wundef -Wcast-qual -Wpointer-arith -Wdate-time
|
|
-Wfloat-equal -Wformat=2 -Wshadow
|
|
-Wsign-compare -Wunused-macros -Wvla -Wdisabled-optimization -Wempty-body -Wignored-qualifiers
|
|
-Wimplicit-fallthrough=3 -Wtype-limits -Wshift-negative-value -Wswitch-default
|
|
-Wframe-larger-than=32768 -Woverloaded-virtual
|
|
-Wnon-virtual-dtor -Wshift-overflow=2 -Wshift-count-overflow
|
|
-Wwrite-strings -Wmissing-format-attribute -Wformat-nonliteral
|
|
-Wdelete-non-virtual-dtor -Wduplicated-cond
|
|
-Wtrampolines -Wsized-deallocation -Wlogical-op -Wsuggest-attribute=format
|
|
-Wduplicated-branches
|
|
-Wmissing-include-dirs -Wformat-signedness
|
|
-Wreturn-local-addr -Wextra
|
|
-Wredundant-decls -Wfloat-conversion
|
|
-Wno-write-strings -Wall -Wno-dangling-else -Wno-comment -Wno-conversion-null -Wno-return-type
|
|
-Wno-unknown-pragmas -Wno-sign-compare
|
|
-Wno-error=undef
|
|
-Wno-error=comment
|
|
-Wno-error=conversion-null
|
|
-Wno-error=dangling-else
|
|
-Wno-error=return-type
|
|
-Wno-error=shadow
|
|
-Wno-error=sign-compare
|
|
-Wno-error=unknown-pragmas
|
|
-Wno-error=unused-parameter
|
|
-Wno-error=cast-qual
|
|
-Wno-error=format=
|
|
-Wno-error=maybe-uninitialized
|
|
-Wno-error=missing-field-initializers
|
|
-Wno-error=redundant-decls
|
|
-Wno-error=unused-variable
|
|
$<$<COMPILE_LANGUAGE:C>:-Wnested-externs>
|
|
$<$<CONFIG:Debug>:-g>
|
|
$<IF:$<VERSION_GREATER:${CMAKE_C_COMPILER_VERSION},4.8.5>,-fstack-protector-strong,-fstack-protector-all>
|
|
)
|
|
target_compile_definitions(intf_pub
|
|
INTERFACE
|
|
$<$<COMPILE_LANGUAGE:CXX>:_GLIBCXX_USE_CXX11_ABI=0>
|
|
$<$<CONFIG:Release>:_FORTIFY_SOURCE=2>
|
|
)
|
|
target_link_options(intf_pub
|
|
INTERFACE
|
|
$<$<STREQUAL:$<TARGET_PROPERTY:TYPE>,EXECUTABLE>:-pie>
|
|
$<$<CONFIG:Release>:-s>
|
|
-Wl,-z,relro
|
|
-Wl,-z,now
|
|
-Wl,-z,noexecstack
|
|
)
|