diff --git a/python/sglang/srt/models/minicpm.py b/python/sglang/srt/models/minicpm.py index 2df170f38..e7c94c85d 100644 --- a/python/sglang/srt/models/minicpm.py +++ b/python/sglang/srt/models/minicpm.py @@ -138,8 +138,6 @@ class MiniCPMAttention(nn.Module): base=rope_theta, rope_scaling=rope_scaling, ) - # set rope as fp32 instead of bf16 - self.rotary_emb.cos_sin_cache = self.rotary_emb._compute_cos_sin_cache() self.attn = RadixAttention( self.num_heads, self.head_dim,