[Fix] fix the typo bug for window attention (#1106)

This commit is contained in:
Ying Sheng
2024-08-14 21:56:01 -07:00
committed by GitHub
parent 326df4bab2
commit 8d2d876fc8

View File

@@ -337,7 +337,7 @@ class ModelRunner:
use_tensor_cores=use_tensor_cores,
)
else:
-self.flashinfer_workspace_buffers = torch.empty(
+self.flashinfer_workspace_buffer = torch.empty(
global_config.flashinfer_workspace_size,
dtype=torch.uint8,
device="cuda",