Signed-off-by: Shangming Cai <csmthu@gmail.com>
This commit is contained in:
@@ -497,7 +497,9 @@ class Qwen3HybridLinearDecoderLayer(nn.Module):
|
|||||||
) -> None:
|
) -> None:
|
||||||
super().__init__()
|
super().__init__()
|
||||||
self.config = config
|
self.config = config
|
||||||
self.linear_attn = Qwen3GatedDeltaNet(config, layer_id, quant_config, alt_stream)
|
self.linear_attn = Qwen3GatedDeltaNet(
|
||||||
|
config, layer_id, quant_config, alt_stream
|
||||||
|
)
|
||||||
|
|
||||||
# Qwen3Next all layers are sparse and have no nextn now
|
# Qwen3Next all layers are sparse and have no nextn now
|
||||||
self.is_layer_sparse = True
|
self.is_layer_sparse = True
|
||||||
|
|||||||
Reference in New Issue
Block a user