From 67e53b16f5f18fdfb2a08a42b77af8dd29057459 Mon Sep 17 00:00:00 2001 From: Lifu Huang Date: Wed, 30 Jul 2025 19:50:54 -0700 Subject: [PATCH] Bump transformers to 4.54.1 to fix Gemma cache issue. (#8541) --- python/pyproject.toml | 2 +- test/srt/models/test_generation_models.py | 3 +-- 2 files changed, 2 insertions(+), 3 deletions(-) diff --git a/python/pyproject.toml b/python/pyproject.toml index 980cb6f8c..1924352d0 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -45,7 +45,7 @@ runtime_common = [ "soundfile==0.13.1", "scipy", "torchao==0.9.0", - "transformers==4.54.0", + "transformers==4.54.1", "timm==1.0.16", "uvicorn", "uvloop", diff --git a/test/srt/models/test_generation_models.py b/test/srt/models/test_generation_models.py index 4ed9d4e12..daa99001d 100644 --- a/test/srt/models/test_generation_models.py +++ b/test/srt/models/test_generation_models.py @@ -51,8 +51,7 @@ class ModelCase: # Popular models that run on the CI CI_MODELS = [ ModelCase("meta-llama/Llama-3.1-8B-Instruct"), - # TODO: Gemma is broken by the bug introduced in the latest transformers version, we should restore once its fixed: https://github.com/huggingface/transformers/issues/39711 - # ModelCase("google/gemma-2-2b"), + ModelCase("google/gemma-2-2b"), ] # the complete set of models to test sglang's generation model