diff --git a/python/sglang/srt/disaggregation/prefill.py b/python/sglang/srt/disaggregation/prefill.py index c6020767b..cdd1676a8 100644 --- a/python/sglang/srt/disaggregation/prefill.py +++ b/python/sglang/srt/disaggregation/prefill.py @@ -226,6 +226,11 @@ class SchedulerDisaggregationPrefillMixin: elif poll == KVPoll.Failed: raise Exception("Transferring failed") + for req in done_reqs: + self.disagg_prefill_pending_queue.req_to_metadata_buffer_idx_allocator.free( + req.metadata_buffer_index + ) + # Stream requests which have finished transfer self.stream_output(done_reqs, False, None)