From 298509008451f7861a848d477829d5816eef12cd Mon Sep 17 00:00:00 2001 From: hlu1 <14827759+hlu1@users.noreply.github.com> Date: Fri, 5 Sep 2025 13:41:01 -0700 Subject: [PATCH] Update flashinfer to 0.3.1 for B300 support (#10087) Signed-off-by: Hao Lu <14827759+hlu1@users.noreply.github.com> --- python/pyproject.toml | 4 ++-- python/sglang/srt/entrypoints/engine.py | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) mode change 100644 => 100755 python/pyproject.toml diff --git a/python/pyproject.toml b/python/pyproject.toml old mode 100644 new mode 100755 index 0c496484e..973307bdc --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -63,7 +63,7 @@ srt = [ "torchaudio==2.8.0", "torchvision", "cuda-python", - "flashinfer_python==0.3.0", + "flashinfer_python==0.3.1", ] blackwell = [ @@ -73,7 +73,7 @@ blackwell = [ "torchaudio==2.8.0", "torchvision", "cuda-python", - "flashinfer_python==0.3.0", + "flashinfer_python==0.3.1", ] # HIP (Heterogeneous-computing Interface for Portability) for AMD diff --git a/python/sglang/srt/entrypoints/engine.py b/python/sglang/srt/entrypoints/engine.py index 9155060c8..4b4cdcb34 100644 --- a/python/sglang/srt/entrypoints/engine.py +++ b/python/sglang/srt/entrypoints/engine.py @@ -673,7 +673,7 @@ def _set_envs_and_config(server_args: ServerArgs): if server_args.attention_backend == "flashinfer": assert_pkg_version( "flashinfer_python", - "0.3.0", + "0.3.1", "Please uninstall the old version and " "reinstall the latest version by following the instructions " "at https://docs.flashinfer.ai/installation.html.",