diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py index e7a102c91..ab28e5abe 100644 --- a/python/sglang/srt/server_args.py +++ b/python/sglang/srt/server_args.py @@ -324,12 +324,6 @@ class ServerArgs: if self.grammar_backend is None: self.grammar_backend = "xgrammar" - if self.pp_size > 1: - self.disable_overlap_schedule = True - logger.warning( - "Overlap scheduler is disabled because of using pipeline parallelism." - ) - # Data parallelism attention if self.enable_dp_attention: self.schedule_conservativeness = self.schedule_conservativeness * 0.3 @@ -1444,8 +1438,6 @@ class ServerArgs: # FIXME pp constraints if self.pp_size > 1: - logger.warning(f"Turn off overlap scheule for pipeline parallelism.") - self.disable_overlap_schedule = True assert ( self.disable_overlap_schedule and self.speculative_algorithm is None