Linear: support DeepGEMM (#4199)

Co-authored-by: yinfan98 <1106310035@qq.com>
2025-03-11 15:38:37 +08:00
parent 4d27eb9ad1
commit dce303e279
3 changed files with 76 additions and 44 deletions
--- a/test/srt/test_fp8_kernel.py
+++ b/test/srt/test_fp8_kernel.py
@@ -17,7 +17,7 @@ class TestFP8Base(unittest.TestCase):
        cls.K = 512
        cls.group_size = 128
        cls.quant_type = torch.float8_e4m3fn
-        cls.output_type = torch.float16
+        cls.output_type = torch.bfloat16

    @staticmethod
    def _make_A(M, K, group_size, out_dtype):