Fix missing revision argument when loading the tokenizer (#2982)

This commit is contained in:
giorgiopiatti-dfinity
2025-01-19 20:36:07 +01:00
committed by GitHub
parent a69cb5cff7
commit 8b6a4486ec
5 changed files with 8 additions and 0 deletions

View File

@@ -71,6 +71,7 @@ class DetokenizerManager:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 self.decode_status = LimitedCapacityDict()

View File

@@ -206,6 +206,7 @@ class Scheduler:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 self.tokenizer = self.processor.tokenizer
 else:
@@ -213,6 +214,7 @@ class Scheduler:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 # Check whether overlap can be enabled

View File

@@ -158,6 +158,7 @@ class TokenizerManager:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 self.tokenizer = self.processor.tokenizer
 os.environ["TOKENIZERS_PARALLELISM"] = "false"
@@ -171,6 +172,7 @@ class TokenizerManager:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 # Store states

View File

@@ -83,6 +83,7 @@ class TpModelWorker:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 self.tokenizer = self.processor.tokenizer
 else:
@@ -90,6 +91,7 @@ class TpModelWorker:
 server_args.tokenizer_path,
 tokenizer_mode=server_args.tokenizer_mode,
 trust_remote_code=server_args.trust_remote_code,
+revision=server_args.revision,
 )
 self.device = self.model_runner.device

View File

@@ -1027,6 +1027,7 @@ class Runtime:
 self.server_args.tokenizer_path,
 tokenizer_mode=self.server_args.tokenizer_mode,
 trust_remote_code=self.server_args.trust_remote_code,
+revision=self.server_args.revision,
 )
 async def async_generate(