[Bug fix] Fix ascend mla in aclgraph (#9925)
This commit is contained in:
@@ -368,7 +368,7 @@ class AscendAttnBackend(AttentionBackend):
 -1, layer.tp_v_head_num, self.page_size, self.kv_lora_rank
 )
 
-q_nope = q.view(-1, layer.tp_q_head_num, 1, self.kv_lora_rank)
+q_nope = q.view(-1, layer.tp_q_head_num, 1, self.kv_lora_rank).contiguous()
 q_rope = q_rope.view(-1, layer.tp_q_head_num, 1, self.qk_rope_head_dim)
 if self.forward_metadata.seq_lens_cpu_int is None:
 actual_seq_len_kv = self.forward_metadata.seq_lens_cpu_list
Reference in New Issue
Block a user