Upgrade to vllm 0.17.0 corex v4.1 overlay
This commit is contained in:
@@ -409,7 +409,7 @@ class Gemma3nAttention(nn.Module):
|
||||
) -> torch.Tensor:
|
||||
qkv, _ = self.qkv_proj(hidden_states)
|
||||
q, k, v = qkv.split([self.q_size, self.kv_size, self.kv_size], dim=-1)
|
||||
|
||||
q, k, v = q.contiguous(), k.contiguous(), v.contiguous()
|
||||
q = q.unflatten(-1, (self.num_heads, self.head_dim))
|
||||
q = self.q_norm(q)
|
||||
q = q.flatten(-2, -1)
|
||||
|
||||
Reference in New Issue
Block a user