[PD] Support prefill overlap + Ensure no race condition (#5609)

This commit is contained in:
Byron Hsu
2025-04-21 12:12:56 -07:00
committed by GitHub
parent e65b9f21e3
commit bf98d2e377
5 changed files with 107 additions and 18 deletions

View File

@@ -2014,7 +2014,10 @@ def run_scheduler_process(
     else:
         scheduler.event_loop_normal()
 elif disaggregation_mode == DisaggregationMode.PREFILL:
-    scheduler.event_loop_normal_disagg_prefill()
+    if scheduler.enable_overlap:
+        scheduler.event_loop_overlap_disagg_prefill()
+    else:
+        scheduler.event_loop_normal_disagg_prefill()
 elif disaggregation_mode == DisaggregationMode.DECODE:
     if scheduler.enable_overlap:
         scheduler.event_loop_overlap_disagg_decode()