Add PDL support for quant kernel and rope kernel (#9106)

This commit is contained in:
fzyzcjy
2025-08-20 16:56:29 +08:00
committed by GitHub
parent c9bf3877a0
commit 42c8704560
7 changed files with 80 additions and 33 deletions

View File

@@ -151,6 +151,7 @@ void apply_rope_pos_ids_cos_sin_cache(
at::Tensor cos_sin_cache,
at::Tensor pos_ids,
bool interleave,
bool enable_pdl,
int64_t cuda_stream,
const std::optional<at::Tensor>& v,
const std::optional<at::Tensor>& k_buffer,