[2/2] Support MHA prefill with FlashAttention 4. (#10937)

Co-authored-by: Hieu Pham <hyhieu@gmail.com>
This commit is contained in:
Lifu Huang
2025-10-08 00:54:20 -07:00
committed by GitHub
parent 97cd38e58d
commit edefab0c64
7 changed files with 34 additions and 23 deletions

View File

@@ -53,7 +53,7 @@ dependencies = [
"scipy",
"sentencepiece",
"setproctitle",
-"sgl-kernel==0.3.14.post1",
+"sgl-kernel==0.3.15",
"soundfile==0.13.1",
"tiktoken",
"timm==1.0.16",