fix: use fa3 unit test on hopper only (#5304)

This commit is contained in:
Yineng Zhang
2025-04-11 15:10:49 -07:00
committed by GitHub
parent 6f8593799b
commit c1dd773c19

View File

@@ -17,7 +17,7 @@ def is_fa3_supported(device=None) -> bool:
# https://docs.nvidia.com/cuda/cuda-c-programming-guide/#shared-memory-8-x
# sgl-kernel currently builds fa3 only for sm90a with CUDA >= 12.4
return (
(torch.cuda.get_device_capability(device)[0] >= 9)
(torch.cuda.get_device_capability(device)[0] == 9)
and (torch.version.cuda >= "12.4")
# or torch.cuda.get_device_capability(device) == (8, 0)
# or torch.cuda.get_device_capability(device) == (8, 7)