diff --git a/benchmark/mmmu/bench_hf.py b/benchmark/mmmu/bench_hf.py index 6735ce7ec..385171e95 100644 --- a/benchmark/mmmu/bench_hf.py +++ b/benchmark/mmmu/bench_hf.py @@ -1,5 +1,6 @@ import argparse +import PIL import torch from data_utils import save_json from eval_utils import ( diff --git a/python/sglang/srt/managers/multimodal_processors/llava.py b/python/sglang/srt/managers/multimodal_processors/llava.py index 27806af4a..a1b0dc1f7 100644 --- a/python/sglang/srt/managers/multimodal_processors/llava.py +++ b/python/sglang/srt/managers/multimodal_processors/llava.py @@ -8,14 +8,23 @@ from sglang.srt.managers.multimodal_processors.base_processor import ( ) from sglang.srt.managers.schedule_batch import Modality, MultimodalDataItem from sglang.srt.mm_utils import expand2square, process_anyres_image -from sglang.srt.models.llava import LlavaMistralForCausalLM, LlavaQwenForCausalLM +from sglang.srt.models.llava import ( + LlavaLlamaForCausalLM, + LlavaMistralForCausalLM, + LlavaQwenForCausalLM, +) from sglang.srt.models.llavavid import LlavaVidForCausalLM from sglang.srt.utils import load_image, logger from sglang.utils import get_exception_traceback class LlavaImageProcessor(BaseMultimodalProcessor): - models = [LlavaVidForCausalLM, LlavaQwenForCausalLM, LlavaMistralForCausalLM] + models = [ + LlavaLlamaForCausalLM, + LlavaVidForCausalLM, + LlavaQwenForCausalLM, + LlavaMistralForCausalLM, + ] def __init__(self, hf_config, server_args, _processor): super().__init__(hf_config, server_args, _processor)