diff --git a/python/sglang/srt/conversation.py b/python/sglang/srt/conversation.py index 29ecb7abd..6f07d0946 100644 --- a/python/sglang/srt/conversation.py +++ b/python/sglang/srt/conversation.py @@ -4,7 +4,7 @@ import dataclasses from enum import IntEnum, auto from typing import Dict, List, Optional, Tuple, Union -from sglang.srt.managers.openai_protocol import ChatCompletionRequest +from sglang.srt.openai_protocol import ChatCompletionRequest class SeparatorStyle(IntEnum): diff --git a/python/sglang/srt/managers/io_struct.py b/python/sglang/srt/managers/io_struct.py index a99498949..6e64380c9 100644 --- a/python/sglang/srt/managers/io_struct.py +++ b/python/sglang/srt/managers/io_struct.py @@ -25,6 +25,7 @@ class GenerateReqInput: return_text_in_logprobs: bool = False # Whether to stream output stream: bool = False + # TODO: make all parameters a Union[List[T], T] to allow for batched requests def post_init(self): is_single = isinstance(self.text, str)