diff --git a/python/sglang/srt/disaggregation/decode.py b/python/sglang/srt/disaggregation/decode.py index e4e3dde71..ece651b4e 100644 --- a/python/sglang/srt/disaggregation/decode.py +++ b/python/sglang/srt/disaggregation/decode.py @@ -158,7 +158,7 @@ class DecodePreallocQueue: preallocated_reqs = [] indices_to_remove = set() - allocatable_tokens = self._allocatable_tokens(count_retracted=True) + allocatable_tokens = self._allocatable_tokens() for i, decode_req in enumerate(self.queue): if not decode_req.waiting_for_input: