DP Attention with Auto DeepEP Dispatch (#7222)
This commit is contained in:
@@ -772,7 +772,7 @@ class SchedulerDisaggregationDecodeMixin:
|
||||
self.last_batch_in_queue = last_batch_in_queue
|
||||
|
||||
def _prepare_idle_batch_and_run(self: Scheduler, batch, delay_process=False):
|
||||
- batch, _ = self.prepare_mlp_sync_batch(batch)
+ batch = self.prepare_mlp_sync_batch(batch)
|
||||
result = None
|
||||
if batch:
|
||||
result = self.run_batch(batch)
|
||||
|
||||
@@ -276,7 +276,7 @@ class SchedulerDisaggregationPrefillMixin:
|
||||
batch = self.get_new_batch_prefill()
|
||||
|
||||
if require_mlp_sync(self.server_args):
|
||||
- batch, _ = self.prepare_mlp_sync_batch(batch)
+ batch = self.prepare_mlp_sync_batch(batch)
|
||||
self.cur_batch = batch
|
||||
|
||||
if batch:
|
||||
@@ -310,7 +310,7 @@ class SchedulerDisaggregationPrefillMixin:
|
||||
batch = self.get_new_batch_prefill()
|
||||
|
||||
if require_mlp_sync(self.server_args):
|
||||
- batch, _ = self.prepare_mlp_sync_batch(batch)
+ batch = self.prepare_mlp_sync_batch(batch)
|
||||
self.cur_batch = batch
|
||||
if batch:
|
||||
result = self.run_batch(batch)
|
||||
|
||||
Reference in New Issue
Block a user