Support copying tensor from cpu to gpu without using copy engines (#10007)

This commit is contained in:
fzyzcjy
2025-09-05 20:07:19 +08:00
committed by GitHub
parent 5e5c30d9ab
commit bd7f882142
6 changed files with 70 additions and 1 deletions

View File

@@ -247,6 +247,7 @@ set(SOURCES
"csrc/attention/vertical_slash_index.cu"
"csrc/elementwise/activation.cu"
"csrc/elementwise/cast.cu"
"csrc/elementwise/copy.cu"
"csrc/elementwise/fused_add_rms_norm_kernel.cu"
"csrc/elementwise/rope.cu"
"csrc/common_extension.cc"