Add PDL support for quant kernel and rope kernel (#9106)

2025-08-20 16:56:29 +08:00
parent c9bf3877a0
commit 42c8704560
7 changed files with 80 additions and 33 deletions
--- a/sgl-kernel/include/sgl_kernel_ops.h
+++ b/sgl-kernel/include/sgl_kernel_ops.h
@@ -151,6 +151,7 @@ void apply_rope_pos_ids_cos_sin_cache(
    at::Tensor cos_sin_cache,
    at::Tensor pos_ids,
    bool interleave,
+    bool enable_pdl,
    int64_t cuda_stream,
    const std::optional<at::Tensor>& v,
    const std::optional<at::Tensor>& k_buffer,