linear support deepgemm (#4199)

Co-authored-by: yinfan98 <1106310035@qq.com>
This commit is contained in:
lukec
2025-03-11 15:38:37 +08:00
committed by GitHub
parent 4d27eb9ad1
commit dce303e279
3 changed files with 76 additions and 44 deletions

View File

@@ -17,7 +17,7 @@ class TestFP8Base(unittest.TestCase):
cls.K = 512
cls.group_size = 128
cls.quant_type = torch.float8_e4m3fn
-cls.output_type = torch.float16
+cls.output_type = torch.bfloat16
@staticmethod
def _make_A(M, K, group_size, out_dtype):