Remove prompt string from engine core data structures (#663)
### What this PR does / why we need it?
vLLM Ascend side follow-up to the upstream vLLM commit:
[Core] Remove prompt string from engine core data structures
(vLLM commit df6f3ce883)
### Does this PR introduce _any_ user-facing change?
No
### How was this patch tested?
CI passed
Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
This commit is contained in:
@@ -346,7 +346,7 @@ class NPUModelRunner:
|
|||||||
generator.manual_seed(sampling_params.seed)
|
generator.manual_seed(sampling_params.seed)
|
||||||
else:
|
else:
|
||||||
generator = None
|
generator = None
|
||||||
|
if vllm_version_is("0.8.4"):
|
||||||
self.requests[req_id] = CachedRequestState(
|
self.requests[req_id] = CachedRequestState(
|
||||||
req_id=req_id,
|
req_id=req_id,
|
||||||
prompt_token_ids=new_req_data.prompt_token_ids,
|
prompt_token_ids=new_req_data.prompt_token_ids,
|
||||||
@@ -360,6 +360,20 @@ class NPUModelRunner:
|
|||||||
output_token_ids=[],
|
output_token_ids=[],
|
||||||
lora_request=new_req_data.lora_request,
|
lora_request=new_req_data.lora_request,
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
# The prompt string was removed upstream by: https://github.com/vllm-project/vllm/pull/17214
|
||||||
|
self.requests[req_id] = CachedRequestState(
|
||||||
|
req_id=req_id,
|
||||||
|
prompt_token_ids=new_req_data.prompt_token_ids,
|
||||||
|
mm_inputs=new_req_data.mm_inputs,
|
||||||
|
mm_positions=new_req_data.mm_positions,
|
||||||
|
sampling_params=sampling_params,
|
||||||
|
generator=generator,
|
||||||
|
block_ids=new_req_data.block_ids,
|
||||||
|
num_computed_tokens=new_req_data.num_computed_tokens,
|
||||||
|
output_token_ids=[],
|
||||||
|
lora_request=new_req_data.lora_request,
|
||||||
|
)
|
||||||
|
|
||||||
req_ids_to_add.append(req_id)
|
req_ids_to_add.append(req_id)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user