[bugfix] matmul_allreduce_add_rmsnorm aclnn interface (#5082)
What this PR does / why we need it?
Fixes the `extern "C"` declaration of the a2 kernel aclnn interface.

Does this PR introduce any user-facing change?
No.

How was this patch tested?
vLLM version: v0.12.0

Signed-off-by: tongrunze <t00574058@china.huawei.com>
Co-authored-by: tongrunze <t00574058@china.huawei.com>
This commit is contained in:
@@ -26,6 +26,10 @@ enum NnopbaseHcclServerType {
|
|||||||
};
|
};
|
||||||
extern "C" void __attribute__((weak)) NnopbaseSetHcclServerType(void *executor, NnopbaseHcclServerType sType);
|
extern "C" void __attribute__((weak)) NnopbaseSetHcclServerType(void *executor, NnopbaseHcclServerType sType);
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
extern "C" {
|
||||||
|
#endif
|
||||||
|
|
||||||
extern aclnnStatus aclnnInnerMatmulAllreduceAddRmsnormGetWorkspaceSize(
|
extern aclnnStatus aclnnInnerMatmulAllreduceAddRmsnormGetWorkspaceSize(
|
||||||
const aclTensor *x1,
|
const aclTensor *x1,
|
||||||
const aclTensor *x2,
|
const aclTensor *x2,
|
||||||
@@ -48,10 +52,6 @@ extern aclnnStatus aclnnInnerMatmulAllreduceAddRmsnorm(
|
|||||||
aclOpExecutor *executor,
|
aclOpExecutor *executor,
|
||||||
aclrtStream stream);
|
aclrtStream stream);
|
||||||
|
|
||||||
#ifdef __cplusplus
|
|
||||||
extern "C" {
|
|
||||||
#endif
|
|
||||||
|
|
||||||
aclnnStatus aclnnMatmulAllreduceAddRmsnormGetWorkspaceSize(
|
aclnnStatus aclnnMatmulAllreduceAddRmsnormGetWorkspaceSize(
|
||||||
const aclTensor *x1,
|
const aclTensor *x1,
|
||||||
const aclTensor *x2,
|
const aclTensor *x2,
|
||||||
|
|||||||
Reference in New Issue
Block a user