Enable chunked prefill by default (#1040)
This commit is contained in:
@@ -49,7 +49,7 @@ class ServerArgs:
|
||||
max_running_requests: Optional[int] = None
|
||||
max_num_reqs: Optional[int] = None
|
||||
max_total_tokens: Optional[int] = None
|
||||
chunked_prefill_size: int = -1
|
||||
chunked_prefill_size: int = 8192
|
||||
max_prefill_tokens: int = 16384
|
||||
schedule_policy: str = "lpm"
|
||||
schedule_conservativeness: float = 1.0
|
||||
|
||||
Reference in New Issue
Block a user