forked from EngineX-Cambricon/enginex-mlu370-vllm
add dynamic register
This commit is contained in:
@@ -274,7 +274,13 @@ class ModelConfig:
|
||||
self, limit_mm_per_prompt: Optional[Mapping[str, int]]
|
||||
) -> Optional["MultiModalConfig"]:
|
||||
architectures = getattr(self.hf_config, "architectures", [])
|
||||
if ModelRegistry.is_multimodal_model(architectures):
|
||||
if ModelRegistry.is_multimodal_model(
|
||||
architectures,
|
||||
model_path=self.model,
|
||||
revision=self.revision,
|
||||
trust_remote_code=self.trust_remote_code,
|
||||
hf_config=self.hf_config,
|
||||
):
|
||||
return MultiModalConfig(limit_per_prompt=limit_mm_per_prompt or {})
|
||||
|
||||
if limit_mm_per_prompt:
|
||||
@@ -308,11 +314,23 @@ class ModelConfig:
|
||||
|
||||
def _init_attention_free(self) -> bool:
|
||||
architectures = getattr(self.hf_config, "architectures", [])
|
||||
return ModelRegistry.is_attention_free_model(architectures)
|
||||
return ModelRegistry.is_attention_free_model(
|
||||
architectures,
|
||||
model_path=self.model,
|
||||
revision=self.revision,
|
||||
trust_remote_code=self.trust_remote_code,
|
||||
hf_config=self.hf_config,
|
||||
)
|
||||
|
||||
def _init_has_inner_state(self) -> bool:
|
||||
architectures = getattr(self.hf_config, "architectures", [])
|
||||
return ModelRegistry.model_has_inner_state(architectures)
|
||||
return ModelRegistry.model_has_inner_state(
|
||||
architectures,
|
||||
model_path=self.model,
|
||||
revision=self.revision,
|
||||
trust_remote_code=self.trust_remote_code,
|
||||
hf_config=self.hf_config,
|
||||
)
|
||||
|
||||
def _verify_tokenizer_mode(self) -> None:
|
||||
tokenizer_mode = self.tokenizer_mode.lower()
|
||||
|
||||
Reference in New Issue
Block a user