set default attention backend for deterministic inference (#11801)

This commit is contained in:
Minglei Zhu
2025-10-18 00:01:24 -07:00
committed by GitHub
parent e68a2b5b2f
commit f4488e9dd9
2 changed files with 26 additions and 2 deletions

View File

@@ -174,6 +174,15 @@ def is_blackwell():
return torch.cuda.get_device_capability()[0] == 10
@lru_cache(maxsize=1)
def is_sm120_supported(device=None) -> bool:
    """Return True if *device* has SM 12.x compute capability and the
    installed CUDA toolkit is at least 12.8.

    Args:
        device: Optional device index/handle forwarded to
            ``torch.cuda.get_device_capability``; ``None`` means the
            current device.

    Returns:
        bool: False when not running on a CUDA-alike backend, when the
        device's major compute capability is not 12, or when the CUDA
        version predates 12.8.
    """
    if not is_cuda_alike():
        return False
    if torch.cuda.get_device_capability(device)[0] != 12:
        return False
    # Compare the CUDA version numerically, not as strings: a string
    # comparison would wrongly treat "12.10" as older than "12.8".
    # NOTE(review): torch.version.cuda is None on ROCm builds; the
    # capability check above is assumed to short-circuit that case —
    # guard explicitly anyway to be safe.
    cuda_version = torch.version.cuda
    if cuda_version is None:
        return False
    major, minor = (int(part) for part in cuda_version.split(".")[:2])
    return (major, minor) >= (12, 8)
@lru_cache(maxsize=1)
def is_sm100_supported(device=None) -> bool:
if not is_cuda_alike():