Initialize model_worker_batch variable (#1973)

This commit is contained in:
Enrique Shockwave
2024-11-09 19:28:02 +00:00
committed by GitHub
parent 95a4ed129a
commit f11eb90fe4

View File

@@ -787,8 +787,8 @@ class Scheduler:
self.forward_ct += 1
if self.is_generation:
model_worker_batch = batch.get_model_worker_batch()
if batch.forward_mode.is_decode() or batch.extend_num_tokens != 0:
model_worker_batch = batch.get_model_worker_batch()
batch.mark_reqs_started()
logits_output, next_token_ids = self.tp_worker.forward_batch_generation(
model_worker_batch