Support incremental streaming of logprob/token_ids between scheduler and detokenizer (#6225)
Co-authored-by: SangBin Cho <rkooo567@gmail.com>
This commit is contained in:
@@ -41,7 +41,7 @@ class BaseGrammarObject:
         raise NotImplementedError()
 
     def is_terminated(self):
-        raise NotImplementedError()
+        return False
 
     def allocate_vocab_mask(
         self, vocab_size: int, batch_size: int, device
Reference in New Issue
Block a user