chore: upgrade sgl-kernel v0.1.8.post2 (#7186)
Co-authored-by: zhyncs <me@zhyncs.com>
This commit is contained in:
@@ -280,6 +280,7 @@ class CutlassMLABackend(FlashInferMLAAttnBackend):
|
||||
seq_lens=forward_batch.seq_lens.to(torch.int32),
|
||||
page_table=self.forward_metadata.block_kv_indices,
|
||||
workspace=self.forward_metadata.workspace,
|
||||
sm_scale=layer.scaling,
|
||||
num_kv_splits=1,
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user