fix: zero_init buffer (#9065)

Co-authored-by: Yineng Zhang <me@zhyncs.com>
This commit is contained in:
eigen
2025-08-14 05:39:09 -04:00
committed by GitHub
parent 3d6be1fbce
commit 4dbf43601d
10 changed files with 27 additions and 16 deletions

View File

@@ -122,6 +122,7 @@ class FlashInferAttnBackend(AttentionBackend):
# Allocate buffers
global global_workspace_buffer
if global_workspace_buffer is None:
# NOTE: this buffer is distinct from flashinfer's zero_init_global_workspace_buffer; it is allocated with torch.empty, so its contents are NOT zero-initialized.
global_workspace_buffer = torch.empty(
global_config.flashinfer_workspace_size,
dtype=torch.uint8,