Add DeepSeek-V3 and Llama 4

This commit is contained in:
Chranos
2026-02-11 15:24:13 +08:00
parent 2ad23aa8da
commit c584139543
5 changed files with 320 additions and 9 deletions

View File

@@ -166,6 +166,7 @@ _SPECULATIVE_DECODING_MODELS = {
"EAGLEModel": ("eagle", "EAGLE"),
"MedusaModel": ("medusa", "Medusa"),
"MLPSpeculatorPreTrainedModel": ("mlp_speculator", "MLPSpeculator"),
"DeepSeekMTPModel": ("deepseek_mtp", "DeepSeekMTP"),
}
# Transformers backend models - wrapper classes for custom HuggingFace models