Fix chunked prefill size for bench_offline_throughput (#2234)

This commit is contained in:
Lianmin Zheng
2024-11-27 23:37:20 -08:00
committed by GitHub
parent b79fffdcb5
commit 09798b36cd

View File

@@ -144,7 +144,7 @@ class ServerArgs:
 if self.served_model_name is None:
     self.served_model_name = self.model_path
-if self.chunked_prefill_size <= 0:
+if self.chunked_prefill_size is not None and self.chunked_prefill_size <= 0:
     # Disable chunked prefill
     self.chunked_prefill_size = None