[API, Feature] Support response prefill for openai API (#1490)
This commit is contained in:
@@ -27,7 +27,7 @@ class TestOpenAIServer(unittest.TestCase):
|
||||
cls.base_url,
|
||||
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
|
||||
api_key=cls.api_key,
|
||||
other_args=("--max-total-token", "1024"),
|
||||
other_args=("--max-total-token", "1024", "--context-len", "8192"),
|
||||
env={"SGLANG_CLIP_MAX_NEW_TOKENS": "256", **os.environ},
|
||||
return_stdout_stderr=True,
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user