feat: add fast_decode_plan from flashinfer, flashinfer to 0.4.0rc3 (#10760)
Co-authored-by: Zihao Ye <yezihhhao@gmail.com>
Co-authored-by: Sleepcoo <Sleepcoo@gmail.com>
This commit is contained in:
@@ -62,7 +62,7 @@ dependencies = [
|
||||
"torchaudio==2.8.0",
|
||||
"torchvision",
|
||||
"cuda-python",
|
||||
-"flashinfer_python==0.4.0rc1",
|
||||
+"flashinfer_python==0.4.0rc3",
|
||||
"openai==1.99.1",
|
||||
"tiktoken",
|
||||
"anthropic>=0.20.0",
|
||||
|
||||
Reference in New Issue
Block a user