Add typo checker in pre-commit (#6179)
Co-authored-by: Brayden Zhong <b8zhong@uwaterloo.ca>
This commit is contained in:
@@ -308,7 +308,7 @@ class FlashAttentionBackend(AttentionBackend):
|
||||
), "Sliding window and cross attention are not supported together"
|
||||
|
||||
self.forward_metadata: FlashAttentionMetadata = None
|
||||
- # extra metdata for handling speculative decoding topk > 1, extended draft decode and verify
|
||||
+ # extra metadata for handling speculative decoding topk > 1, extended draft decode and verify
|
||||
self.forward_metadata_spec_decode_expand: FlashAttentionMetadata = None
|
||||
self.max_context_len = model_runner.model_config.context_len
|
||||
self.device = model_runner.device
|
||||
|
||||
@@ -919,7 +919,7 @@ def _fwd_kernel(
|
||||
|
||||
e_max = n_e_max
|
||||
|
||||
- # stage 2: compute the trianlge part
|
||||
+ # stage 2: compute the triangle part
|
||||
|
||||
cur_block_m_end = tl.minimum(cur_seq_len_extend, (cur_block_m + 1) * BLOCK_M)
|
||||
for start_n in range(0, cur_block_m_end, BLOCK_N):
|
||||
|
||||
Reference in New Issue
Block a user