Support Dots.ocr model (#11071)

This commit is contained in:
qrskannbara
2025-10-01 03:18:39 +08:00
committed by GitHub
parent a6cc86df9d
commit fb367acfcb
6 changed files with 244 additions and 3 deletions

View File

@@ -5,6 +5,7 @@ from typing import Dict, List, Union
from PIL import Image
+from sglang.srt.models.dots_ocr import DotsOCRForCausalLM
from sglang.srt.models.dots_vlm import DotsVLMForCausalLM
from sglang.srt.multimodal.processors.base_processor import (
BaseMultimodalProcessor,
@@ -14,7 +15,7 @@ from sglang.srt.multimodal.processors.qwen_vl import resize_image_async
class DotsVLMImageProcessor(BaseMultimodalProcessor):
-models = [DotsVLMForCausalLM]
+models = [DotsVLMForCausalLM, DotsOCRForCausalLM]
def __init__(self, hf_config, server_args, _processor, *args, **kwargs):
super().__init__(hf_config, server_args, _processor, *args, **kwargs)
@@ -82,11 +83,9 @@ class DotsVLMImageProcessor(BaseMultimodalProcessor):
for image in base_output.images
]
base_output.images = await asyncio.gather(*resize_tasks)
combined_mm_item, input_ids, _ = self.process_and_combine_mm_data(
base_output, self.mm_tokens
)
if combined_mm_item is None:
return None