Fix GPU out-of-memory (OOM) error (#6564)

Co-authored-by: michael <michael.zhang@amd.com>
This commit is contained in:
kk
2025-05-25 07:38:39 +08:00
committed by GitHub
parent 24c035f2e3
commit 7a5e6ce1cb
8 changed files with 15 additions and 16 deletions

View File

@@ -506,6 +506,7 @@ class AiterIndicesUpdaterPrefill:
spec_info.generate_attn_arg_prefill(
req_pool_indices,
paged_kernel_lens,
None,
self.req_to_token,
)
)