@@ -45,7 +45,7 @@ include(FetchContent)
|
|||||||
FetchContent_Declare(
|
FetchContent_Declare(
|
||||||
repo-cutlass
|
repo-cutlass
|
||||||
GIT_REPOSITORY https://github.com/NVIDIA/cutlass
|
GIT_REPOSITORY https://github.com/NVIDIA/cutlass
|
||||||
GIT_TAG ad7b2f5e84fcfa124cb02b91d5bd26d238c0459e
|
GIT_TAG f115c3f85467d5d9619119d1dbeb9c03c3d73864
|
||||||
GIT_SHALLOW OFF
|
GIT_SHALLOW OFF
|
||||||
)
|
)
|
||||||
FetchContent_Populate(repo-cutlass)
|
FetchContent_Populate(repo-cutlass)
|
||||||
|
|||||||
2
sgl-kernel/csrc/gemm/fp8_blockwise_gemm_kernel.cu
Normal file → Executable file
2
sgl-kernel/csrc/gemm/fp8_blockwise_gemm_kernel.cu
Normal file → Executable file
@@ -140,7 +140,7 @@ void launch_sm90_fp8_blockwise_scaled_mm(
|
|||||||
LayoutSFB layout_sfb = ScaleConfig::tile_atom_to_shape_SFB(make_shape(m, n, k, 1));
|
LayoutSFB layout_sfb = ScaleConfig::tile_atom_to_shape_SFB(make_shape(m, n, k, 1));
|
||||||
|
|
||||||
typename GemmKernel::MainloopArguments mainloop_args{
|
typename GemmKernel::MainloopArguments mainloop_args{
|
||||||
a_ptr, stride_a, b_ptr, stride_b, 4, a_s_ptr, layout_sfa, b_s_ptr, layout_sfb};
|
a_ptr, stride_a, b_ptr, stride_b, a_s_ptr, layout_sfa, b_s_ptr, layout_sfb};
|
||||||
typename GemmKernel::EpilogueArguments epilogue_args{{}, nullptr, stride_d, o_ptr, stride_d};
|
typename GemmKernel::EpilogueArguments epilogue_args{{}, nullptr, stride_d, o_ptr, stride_d};
|
||||||
|
|
||||||
typename Gemm::Arguments args = {
|
typename Gemm::Arguments args = {
|
||||||
|
|||||||
Reference in New Issue
Block a user