Fix chunked prefill size for bench_offline_throughput (#2234)
This commit is contained in:
@@ -144,7 +144,7 @@ class ServerArgs:
|
|||||||
if self.served_model_name is None:
|
if self.served_model_name is None:
|
||||||
self.served_model_name = self.model_path
|
self.served_model_name = self.model_path
|
||||||
|
|
||||||
if self.chunked_prefill_size <= 0:
|
if self.chunked_prefill_size is not None and self.chunked_prefill_size <= 0:
|
||||||
# Disable chunked prefill
|
# Disable chunked prefill
|
||||||
self.chunked_prefill_size = None
|
self.chunked_prefill_size = None
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user