Test the case when max_new_tokens is very large (#1038)

This commit is contained in:
Lianmin Zheng
2024-08-11 16:41:03 -07:00
committed by GitHub
parent d785412077
commit d84c5e70f7
7 changed files with 100 additions and 14 deletions

View File

@@ -64,7 +64,7 @@ class ServerArgs:
# Other
api_key: Optional[str] = None
-file_storage_pth: str = "SGlang_storage"
+file_storage_pth: str = "SGLang_storage"
# Data parallelism
dp_size: int = 1