diff --git a/python/sglang/srt/models/qwen3_next.py b/python/sglang/srt/models/qwen3_next.py index 245145542..6e6a99cf8 100644 --- a/python/sglang/srt/models/qwen3_next.py +++ b/python/sglang/srt/models/qwen3_next.py @@ -497,7 +497,9 @@ class Qwen3HybridLinearDecoderLayer(nn.Module): ) -> None: super().__init__() self.config = config - self.linear_attn = Qwen3GatedDeltaNet(config, layer_id, quant_config, alt_stream) + self.linear_attn = Qwen3GatedDeltaNet( + config, layer_id, quant_config, alt_stream + ) # Qwen3Next all layers are sparse and have no nextn now self.is_layer_sparse = True