fix: only compile ApplyTokenBitmaskInplace on CUDA 12.4 or newer (cu124+) (#5686)
This commit is contained in:
@@ -26,6 +26,8 @@
|
|||||||
#include <ATen/cuda/CUDAContext.h>
|
#include <ATen/cuda/CUDAContext.h>
|
||||||
// clang-format on
|
// clang-format on
|
||||||
|
|
||||||
|
#if defined CUDA_VERSION && CUDA_VERSION >= 12040
|
||||||
|
|
||||||
#ifndef CUDART_INF_FP16
|
#ifndef CUDART_INF_FP16
|
||||||
#define CUDART_INF_FP16 __ushort_as_half((unsigned short)0x7C00U)
|
#define CUDART_INF_FP16 __ushort_as_half((unsigned short)0x7C00U)
|
||||||
#endif
|
#endif
|
||||||
@@ -249,3 +251,4 @@ void ApplyTokenBitmaskInplace(at::Tensor logits, at::Tensor bitmask, at::optiona
|
|||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|||||||
Reference in New Issue
Block a user