diff --git a/vllm_ascend/distributed/kv_transfer/kv_pool/ascend_store/pool_scheduler.py b/vllm_ascend/distributed/kv_transfer/kv_pool/ascend_store/pool_scheduler.py index 80468456..2629b695 100644 --- a/vllm_ascend/distributed/kv_transfer/kv_pool/ascend_store/pool_scheduler.py +++ b/vllm_ascend/distributed/kv_transfer/kv_pool/ascend_store/pool_scheduler.py @@ -78,6 +78,9 @@ class KVPoolScheduler: else: token_len = len(request.prompt_token_ids) + if token_len < self._block_size: + return 0, False + num_external_hit_tokens = self.client.lookup(token_len, request.block_hashes) if num_external_hit_tokens == request.num_tokens: