forked from EngineX-Cambricon/enginex-mlu370-vllm
add deepseekv3 and llama4
This commit is contained in:
@@ -60,6 +60,7 @@ class MLUWorker(Worker):
|
|||||||
speculative_config = self.speculative_config
|
speculative_config = self.speculative_config
|
||||||
model_config = self.model_config
|
model_config = self.model_config
|
||||||
is_mtp = (speculative_config is not None
|
is_mtp = (speculative_config is not None
|
||||||
|
and model_config.task != "draft"
|
||||||
and getattr(
|
and getattr(
|
||||||
speculative_config.draft_model_config.hf_config,
|
speculative_config.draft_model_config.hf_config,
|
||||||
"model_type", None) == "deepseek_mtp")
|
"model_type", None) == "deepseek_mtp")
|
||||||
|
|||||||
Reference in New Issue
Block a user