From 09798b36cd31f8f9787cc43a5aed9bca173ada40 Mon Sep 17 00:00:00 2001 From: Lianmin Zheng Date: Wed, 27 Nov 2024 23:37:20 -0800 Subject: [PATCH] Fix chunked prefill size for bench_offline_throughput (#2234) --- python/sglang/srt/server_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py index b545e00c0..144ade58e 100644 --- a/python/sglang/srt/server_args.py +++ b/python/sglang/srt/server_args.py @@ -144,7 +144,7 @@ class ServerArgs: if self.served_model_name is None: self.served_model_name = self.model_path - if self.chunked_prefill_size <= 0: + if self.chunked_prefill_size is not None and self.chunked_prefill_size <= 0: # Disable chunked prefill self.chunked_prefill_size = None