Upgrade CUTLASS 4.0 (#6336)

Co-authored-by: zhyncs <me@zhyncs.com>
This commit is contained in:
Elfie Guo
2025-05-15 17:42:23 -07:00
committed by GitHub
parent e07a6977e7
commit c23a7072b6
2 changed files with 2 additions and 2 deletions

View File

@@ -45,7 +45,7 @@ include(FetchContent)
FetchContent_Declare(
repo-cutlass
GIT_REPOSITORY https://github.com/NVIDIA/cutlass
GIT_TAG ad7b2f5e84fcfa124cb02b91d5bd26d238c0459e
GIT_TAG f115c3f85467d5d9619119d1dbeb9c03c3d73864
GIT_SHALLOW OFF
)
FetchContent_Populate(repo-cutlass)

2
sgl-kernel/csrc/gemm/fp8_blockwise_gemm_kernel.cu Normal file → Executable file
View File

@@ -140,7 +140,7 @@ void launch_sm90_fp8_blockwise_scaled_mm(
LayoutSFB layout_sfb = ScaleConfig::tile_atom_to_shape_SFB(make_shape(m, n, k, 1));
typename GemmKernel::MainloopArguments mainloop_args{
a_ptr, stride_a, b_ptr, stride_b, 4, a_s_ptr, layout_sfa, b_s_ptr, layout_sfb};
a_ptr, stride_a, b_ptr, stride_b, a_s_ptr, layout_sfa, b_s_ptr, layout_sfb};
typename GemmKernel::EpilogueArguments epilogue_args{{}, nullptr, stride_d, o_ptr, stride_d};
typename Gemm::Arguments args = {