[PD] Support decode overlap schedule (#5608)

This commit is contained in:
Byron Hsu
2025-04-21 12:06:16 -07:00
committed by GitHub
parent 4dce1cc608
commit e65b9f21e3
3 changed files with 49 additions and 5 deletions

View File

@@ -2016,7 +2016,10 @@ def run_scheduler_process(
elif disaggregation_mode == DisaggregationMode.PREFILL:
scheduler.event_loop_normal_disagg_prefill()
elif disaggregation_mode == DisaggregationMode.DECODE:
-scheduler.event_loop_normal_disagg_decode()
+if scheduler.enable_overlap:
+scheduler.event_loop_overlap_disagg_decode()
+else:
+scheduler.event_loop_normal_disagg_decode()
except Exception:
traceback = get_exception_traceback()