TokenizerManager.context_len should inherit from `server_args.context_length` (#654)
This commit is contained in:
@@ -69,6 +69,9 @@ class TokenizerManager:
|
|||||||
trust_remote_code=server_args.trust_remote_code,
|
trust_remote_code=server_args.trust_remote_code,
|
||||||
model_overide_args=model_overide_args,
|
model_overide_args=model_overide_args,
|
||||||
)
|
)
|
||||||
|
if server_args.context_length is not None:
|
||||||
|
self.context_len = server_args.context_length
|
||||||
|
else:
|
||||||
self.context_len = get_context_length(self.hf_config)
|
self.context_len = get_context_length(self.hf_config)
|
||||||
|
|
||||||
if is_multimodal_model(self.model_path):
|
if is_multimodal_model(self.model_path):
|
||||||
|
|||||||
Reference in New Issue
Block a user