fix: solve cu118 (CUDA 11.8) build issue for cutlass mla (#5331)

This commit is contained in:
Yineng Zhang
2025-04-12 12:51:09 -07:00
committed by GitHub
parent 4879e50c6d
commit 812e82f35e
3 changed files with 17 additions and 7 deletions

View File

@@ -25,6 +25,8 @@ limitations under the License.
#include <device/sm100_mla.hpp>
#include <kernel/sm100_mla_tile_scheduler.hpp>
#if defined CUDA_VERSION && CUDA_VERSION >= 12040
#define CUTLASS_CHECK(status) \
{ \
cutlass::Status error = status; \
@@ -205,3 +207,5 @@ int64_t cutlass_mla_get_workspace_size(int64_t max_seq_len, int64_t num_batches,
return MlaSm100Type::Fmha::get_workspace_size(arguments);
}
#endif