update vllm

This commit is contained in:
zhousha
2025-12-01 18:40:23 +08:00
parent ce7fc3b2c4
commit b1635efc43
15 changed files with 82 additions and 25 deletions

View File

@@ -9,19 +9,44 @@
支持模型列表:
- jina-embeddings-v3
- DeepSeek-R1_ollama
- DeepSeek-R1_pytorch
- DeepSeek-R1-Distill
- ChatGLM3-6B
- QwQ-32B
- DeepSeek-V3
- deepseek-ai/DeepSeek-R1
- Qwen/QwQ-32B
- deepseek-ai/DeepSeek-V3
- deepseek-ai/DeepSeek-V3.1
- LLaMA_Fastchat_pytorch
- Qwen3
- Qwen3-30B-A3B_vllm
- Qwen/Qwen3-30B-A3B
- Qwen-7B_fastllm
- ChatGLM-6B_fastllm
- ChatGLM-6B_pytorch
- ZhipuAI/ChatGLM-6B
- Shanghai_AI_Laboratory/internlm-chat-7b
- ZhipuAI/glm-4v-9b
- ZhipuAI/GLM-4-9B-0414
- deepseek-ai/DeepSeek-Coder-V2-Base
- openai-community/gpt2
- ZhipuAI/chatglm2-6b
- Qwen/Qwen-7B-Chat
- baichuan-inc/Baichuan2-13B-Chat
- ZhipuAI/chatglm3-6b
- deepseek-ai/DeepSeek-V2
- Qwen/Qwen2.5-Omni-7B
- deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
- deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
- deepseek-ai/DeepSeek-R1-Distill-Llama-8B
- deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
- deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
- deepseek-ai/DeepSeek-R1-Distill-Llama-70B
- LLM-Research/Meta-Llama-3-8B-Instruct
- Qwen/Qwen1.5-14B-Chat
- Qwen/Qwen2-7B
- Qwen/Qwen3-Embedding-0.6B
- baichuan-inc/baichuan-7B
- gaodema/GME-Qwen2-VL
- OpenBMB/MiniCPM3-4B
- ZhipuAI/glm-10b-chinese
- 01ai/Yi-6B-Chat
- 01ai/Yi-34B-Chat