From c04a8a820bd45248ed71f677bda43cd977a137e8 Mon Sep 17 00:00:00 2001 From: JieXin Liang Date: Sat, 5 Jul 2025 19:02:14 +0800 Subject: [PATCH] [fix] fix misuse of is_cuda (#7790) --- python/sglang/srt/models/deepseek_v2.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index f254a7b3e..044fed350 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -913,7 +913,7 @@ class DeepseekV2AttentionMLA(nn.Module): and self.fused_qkv_a_proj_with_mqa.weight.dtype == torch.bfloat16 and self.fused_qkv_a_proj_with_mqa.weight.shape[0] == 2112 and self.fused_qkv_a_proj_with_mqa.weight.shape[1] == 7168 - and is_cuda + and _is_cuda and _device_sm >= 90 )