[v0.11.0-dev][CI] Fix ngram proposer error caused by missing `dummy_compute_logits` input argument (#4648)
### What this PR does / why we need it?

Fix the error raised because the ngram proposer is missing the `dummy_compute_logits` input argument.

### How was this patch tested?

CI passed with the existing tests.

---------

Signed-off-by: MengqingCao <cmq0113@163.com>
This commit is contained in:
@@ -35,7 +35,8 @@ class Proposer:
|
||||
num_reqs: int = 0,
|
||||
num_tokens_across_dp: Optional[torch.Tensor] = None,
|
||||
aclgraph_runtime_mode: CUDAGraphMode = CUDAGraphMode.NONE,
|
||||
batch_descriptor=None):
|
||||
batch_descriptor=None,
|
||||
dummy_compute_logits=lambda hidden_states: None):
|
||||
"""Called by dummy_run in modle_runner"""
|
||||
raise NotImplementedError
|
||||
|
||||
|
||||
@@ -26,7 +26,8 @@ class NgramProposer(VllmNgramProposer, Proposer):
|
||||
num_reqs=None,
|
||||
num_tokens_across_dp=None,
|
||||
aclgraph_runtime_mode: CUDAGraphMode = CUDAGraphMode.NONE,
|
||||
batch_descriptor=None):
|
||||
batch_descriptor=None,
|
||||
dummy_compute_logits=lambda hidden_states: None):
|
||||
pass
|
||||
|
||||
def generate_token_ids(self,
|
||||
|
||||
Reference in New Issue
Block a user