[fix] fix illegal mem access and clean up triton attention backend (#4571)
This commit is contained in:
@@ -265,7 +265,8 @@ class TestTritonAttention(unittest.TestCase):
 o,
 kv_indptr,
 kv_indices,
-(attn_logits, attn_lse),
+attn_logits,
+attn_lse,
 num_kv_splits,
 max_kv_splits,
 sm_scale,
@@ -329,7 +330,8 @@ class TestTritonAttention(unittest.TestCase):
 o,
 kv_indptr,
 kv_indices,
-(attn_logits, attn_lse),
+attn_logits,
+attn_lse,
 num_kv_splits,
 max_kv_splits,
 sm_scale,
@@ -353,7 +355,8 @@ class TestTritonAttention(unittest.TestCase):
 o_grouped,
 kv_indptr,
 kv_indices,
-(attn_logits1, attn_lse1),
+attn_logits1,
+attn_lse1,
 num_kv_splits,
 max_kv_splits,
 sm_scale,
Reference in New Issue
Block a user