fix: only compile ApplyTokenBitmaskInplace on cu124+ (#5686)

2025-04-23 14:17:42 -07:00
parent b1f6d89b5f
commit ce4ecba477
1 changed file with 3 additions and 0 deletions
--- a/sgl-kernel/csrc/grammar/apply_token_bitmask_inplace_cuda.cu
+++ b/sgl-kernel/csrc/grammar/apply_token_bitmask_inplace_cuda.cu
@@ -26,6 +26,8 @@
 #include <ATen/cuda/CUDAContext.h>
 // clang-format on

+#if defined CUDA_VERSION && CUDA_VERSION >= 12040
+
 #ifndef CUDART_INF_FP16
 #define CUDART_INF_FP16 __ushort_as_half((unsigned short)0x7C00U)
 #endif
@@ -249,3 +251,4 @@ void ApplyTokenBitmaskInplace(at::Tensor logits, at::Tensor bitmask, at::optiona
      break;
  }
 }
+#endif