From c977d42ab26f726cd282cbb15b6046ee87d8fca2 Mon Sep 17 00:00:00 2001
From: zhousha <736730048@qq.com>
Date: Thu, 4 Dec 2025 20:17:51 +0800
Subject: [PATCH] update
---
README.md | 15 +++++++++++++--
enginex/BLIP3o-Model.md | 18 ++++++++++++++++++
enginex/DeepSeek-OCR.md | 9 ---------
enginex/Florence-2-large-ft.md | 9 +++++++++
enginex/Kimi-VL-A3B-Instruct.md | 13 +++++++++++++
enginex/Kimi-VL-A3B-Thinking.md | 13 +++++++++++++
enginex/Marco-o1.md | 11 +++++++++++
enginex/MiniCPM-V-2_6.md | 12 ++++++++++++
enginex/OmniParser.md | 11 +++++++++++
enginex/Ovis1.6-Gemma2-9B.md | 11 +++++++++++
enginex/VITA-1.5.md | 15 +++++++++++++++
enginex/llava-v1.5-7b.md | 10 ++++++++++
enginex/mini-omni2.md | 15 +++++++++++++++
enginex/var.md | 13 +++++++++++++
14 files changed, 164 insertions(+), 11 deletions(-)
create mode 100644 enginex/BLIP3o-Model.md
delete mode 100644 enginex/DeepSeek-OCR.md
create mode 100644 enginex/Florence-2-large-ft.md
create mode 100644 enginex/Kimi-VL-A3B-Instruct.md
create mode 100644 enginex/Kimi-VL-A3B-Thinking.md
create mode 100644 enginex/Marco-o1.md
create mode 100644 enginex/MiniCPM-V-2_6.md
create mode 100644 enginex/OmniParser.md
create mode 100644 enginex/Ovis1.6-Gemma2-9B.md
create mode 100644 enginex/VITA-1.5.md
create mode 100644 enginex/llava-v1.5-7b.md
create mode 100644 enginex/mini-omni2.md
create mode 100644 enginex/var.md
diff --git a/README.md b/README.md
index 6465f9a..5868b72 100644
--- a/README.md
+++ b/README.md
@@ -10,9 +10,20 @@
支持模型列表:
- deepseek-ai/Janus-Pro-7B
- PaddlePaddle/PaddleOCR-VL
-- deepseek-ai/DeepSeek-OCR
- Qwen/Qwen2.5-7B-instruct
- Qwen/Qwen2-VL-2B-Instruct
- ZhipuAI/glm-4v-9b
- LLM-Research/gemma-3-27b-it
-- stepfun-ai/step3
\ No newline at end of file
+- stepfun-ai/step3
+- OpenBMB/MiniCPM-V
+- huangjianuo/llava-v1.5-7b
+- gpt-omni/mini-omni2
+- FoundationVision/var
+- AIDC-AI/Ovis1.6-Gemma2-9B
+- VITA-MLLM/VITA-1.5
+- AIDC-AI/Marco-o1
+- moonshotai/Kimi-VL-A3B-Thinking
+- AI-ModelScope/Florence-2-large-ft
+- BLIP3o/BLIP3o-Model
+- AI-ModelScope/OmniParser
+- moonshotai/Kimi-VL-A3B-Instruct
\ No newline at end of file
diff --git a/enginex/BLIP3o-Model.md b/enginex/BLIP3o-Model.md
new file mode 100644
index 0000000..353f39e
--- /dev/null
+++ b/enginex/BLIP3o-Model.md
@@ -0,0 +1,18 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.4.1-ubuntu22.04-dtk25.04-py3.10-fixpy
+# 将下面命令中的 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:6063b673703a
+docker run -it --shm-size=64G -v $PWD/BLIP3o:/home/BLIP3o -v /opt/hyhal:/opt/hyhal:ro --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name blip3o {imageID} bash
+
+cd /home/BLIP3o
+pip install -r requirements.txt -i https://mirrors.aliyun.com/pypi/simple
+pip install whl/bitsandbytes-0.42.0+das.opt1.dtk2504-py3-none-any.whl # bitsandbytes==0.42
+pip install whl/torchaudio-2.1.2+das.opt2.dtk24043-cp310-cp310-manylinux_2_28_x86_64.whl # torchaudio==2.1.2
+
+cd diffusers
+pip install -e . -i https://mirrors.aliyun.com/pypi/simple # diffusers==0.32.2
+
+cd /home/BLIP3o
+pip install -e . -i https://mirrors.aliyun.com/pypi/simple # blip3o==0.1.0
+```
diff --git a/enginex/DeepSeek-OCR.md b/enginex/DeepSeek-OCR.md
deleted file mode 100644
index fb6de17..0000000
--- a/enginex/DeepSeek-OCR.md
+++ /dev/null
@@ -1,9 +0,0 @@
-# 运行方式
-
-```python
-docker pull git.modelhub.org.cn:9443/enginex-hygon/vllm:0.8.5-ubuntu22.04-dtk25.04.1-rc5-das1.6-py3.10-20250724
-docker run -it --shm-size 200g --network=host --name {docker_name} --privileged --device=/dev/kfd --device=/dev/dri --device=/dev/mkfd --group-add video --cap-add=SYS_PTRACE --security-opt seccomp=unconfined -u root -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal/:/opt/hyhal/:ro {imageID} bash
-
-cd /your_code_path/deepseek-ocr_pytorch
-
-```
diff --git a/enginex/Florence-2-large-ft.md b/enginex/Florence-2-large-ft.md
new file mode 100644
index 0000000..eb2d997
--- /dev/null
+++ b/enginex/Florence-2-large-ft.md
@@ -0,0 +1,9 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.4.1-ubuntu22.04-dtk25.04-py3.10-fixpy
+# 将下面命令中的 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:6063b673703a
+docker run -it --shm-size=64G -v $PWD/Florence-2-Vision-Language-Model:/home/Florence-2-Vision-Language-Model -v /opt/hyhal:/opt/hyhal:ro --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name florence2 {imageID} bash
+cd /home/Florence-2-Vision-Language-Model
+pip install -r requirements.txt -i https://mirrors.aliyun.com/pypi/simple
+```
diff --git a/enginex/Kimi-VL-A3B-Instruct.md b/enginex/Kimi-VL-A3B-Instruct.md
new file mode 100644
index 0000000..f528814
--- /dev/null
+++ b/enginex/Kimi-VL-A3B-Instruct.md
@@ -0,0 +1,13 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-py3.10-dtk24.04.3-ubuntu20.04
+
+docker run -it --shm-size=1024G -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal:/opt/hyhal --network=host --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name kimi-vl {imageID} bash # 将 {imageID} 替换为以上拉取的docker镜像的ID
+
+git clone http://developer.sourcefind.cn/codes/modelzoo/kimi-vl-a3b-instruct_pytorch.git
+
+cd /path/your_code_data/
+
+pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple
+```
diff --git a/enginex/Kimi-VL-A3B-Thinking.md b/enginex/Kimi-VL-A3B-Thinking.md
new file mode 100644
index 0000000..aeb4133
--- /dev/null
+++ b/enginex/Kimi-VL-A3B-Thinking.md
@@ -0,0 +1,13 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-py3.10-dtk24.04.3-ubuntu20.04
+
+docker run -it --shm-size=1024G -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal:/opt/hyhal --network=host --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name kimi-vl-thinking {imageID} bash # 将 {imageID} 替换为以上拉取的docker镜像的ID
+
+git clone http://developer.sourcefind.cn/codes/modelzoo/kimi-vl-a3b-thinking_pytorch.git
+
+cd /path/your_code_data/
+
+pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple
+```
diff --git a/enginex/Marco-o1.md b/enginex/Marco-o1.md
new file mode 100644
index 0000000..98c2bf7
--- /dev/null
+++ b/enginex/Marco-o1.md
@@ -0,0 +1,11 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-py3.10-dtk24.04.3-ubuntu20.04
+# 将下面命令中的 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:b272aae8ec72
+docker run -it --shm-size=64G -v $PWD/Marco-o1:/home/Marco-o1 -v /opt/hyhal:/opt/hyhal:ro --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name marcoo1 {imageID} bash
+cd /home/Marco-o1
+pip install -r requirements.txt
+pip install whl/lmslim-0.1.2+das.dtk24043-cp310-cp310-linux_x86_64.whl # 安装lmslim==0.1.2
+pip install whl/vllm-0.6.2+das.opt1.cd549d3.dtk24043-cp310-cp310-linux_x86_64.whl # 安装vllm==0.6.2
+```
diff --git a/enginex/MiniCPM-V-2_6.md b/enginex/MiniCPM-V-2_6.md
new file mode 100644
index 0000000..d916e87
--- /dev/null
+++ b/enginex/MiniCPM-V-2_6.md
@@ -0,0 +1,12 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-py3.10-dtk24.04.3-ubuntu20.04
+docker run -it --shm-size=1024G -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal:/opt/hyhal --network=host --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name minicpm_v {imageID} bash # 将 {imageID} 替换为以上拉取的docker镜像的ID
+
+git clone http://developer.sourcefind.cn/codes/modelzoo/minicpm-v-2_6_pytorch.git
+
+cd /path/your_code_data/
+
+pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple
+```
diff --git a/enginex/OmniParser.md b/enginex/OmniParser.md
new file mode 100644
index 0000000..a8f07f6
--- /dev/null
+++ b/enginex/OmniParser.md
@@ -0,0 +1,11 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-ubuntu22.04-dtk24.04.3-py3.10
+
+docker run --shm-size 50g --network=host --name=dpskr1 --privileged --device=/dev/kfd --device=/dev/dri --group-add video --cap-add=SYS_PTRACE --security-opt seccomp=unconfined -v 项目地址(绝对路径):/home/ -v /opt/hyhal:/opt/hyhal:ro -it {imageID} bash # 将 {imageID} 替换为以上拉取的docker镜像的ID
+
+pip install https://download.sourcefind.cn:65024/directlink/4/paddle/DAS1.3/paddlepaddle-2.6.1+das.opt1.dtk24043-cp310-cp310-manylinux_2_28_x86_64.whl
+
+pip install -r requirements.txt
+```
diff --git a/enginex/Ovis1.6-Gemma2-9B.md b/enginex/Ovis1.6-Gemma2-9B.md
new file mode 100644
index 0000000..0e44d0a
--- /dev/null
+++ b/enginex/Ovis1.6-Gemma2-9B.md
@@ -0,0 +1,11 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.1.0-ubuntu20.04-dtk24.04.1-py3.10
+docker run -it --shm-size=1024G -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal:/opt/hyhal --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name ovis_pytorch {imageID} bash # 将 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:a4dd5be0ca23
+cd /path/your_code_data/
+pip install -r requirements.txt -i https://mirrors.aliyun.com/pypi/simple/ --trusted-host mirrors.aliyun.com
+pip install --no-deps -e .
+cd VLMEvalKit
+pip install -e .
+```
diff --git a/enginex/VITA-1.5.md b/enginex/VITA-1.5.md
new file mode 100644
index 0000000..37048be
--- /dev/null
+++ b/enginex/VITA-1.5.md
@@ -0,0 +1,15 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-ubuntu22.04-dtk24.04.2-py3.10
+# 将下面命令中的 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:83714c19d308
+docker run -it --shm-size=64G -v $PWD/VITA:/home/VITA -v /opt/hyhal:/opt/hyhal:ro --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name vita {imageID} bash
+cd /home/VITA
+pip install -r requirements.txt # requirements.txt
+# 安装torchaudio读取音频所需的ffmpeg-4.4.4
+sh ffmpeg_env.sh
+# 安装gradio
+pip install gradio==5.4.0 # gradio
+cp -r frpc_linux_amd64 /usr/local/lib/python3.10/site-packages/gradio/frpc_linux_amd64_v0.3
+chmod +x /usr/local/lib/python3.10/site-packages/gradio/frpc_linux_amd64_v0.3
+```
diff --git a/enginex/llava-v1.5-7b.md b/enginex/llava-v1.5-7b.md
new file mode 100644
index 0000000..fc462e2
--- /dev/null
+++ b/enginex/llava-v1.5-7b.md
@@ -0,0 +1,10 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-ubuntu22.04-dtk24.04.3-py3.10
+# {imageID} 用上面拉取docker镜像的ID替换
+# {host_path} 主机端路径
+# {container_path} 容器映射路径
+# 若要在主机端和容器端映射端口需要删除--network host参数
+docker run -it --name llava_vllm --privileged --shm-size=64G --device=/dev/kfd --device=/dev/dri/ --cap-add=SYS_PTRACE --security-opt seccomp=unconfined --ulimit memlock=-1:-1 --ipc=host --network host --group-add video -v /opt/hyhal:/opt/hyhal -v {host_path}:{container_path} {imageID} /bin/bash
+```
diff --git a/enginex/mini-omni2.md b/enginex/mini-omni2.md
new file mode 100644
index 0000000..7aeae9a
--- /dev/null
+++ b/enginex/mini-omni2.md
@@ -0,0 +1,15 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.3.0-ubuntu22.04-dtk24.04.2-py3.10
+# 将下面命令中的 {imageID} 替换为以上拉取的docker镜像的ID,本镜像为:83714c19d308
+docker run -it --shm-size=64G -v $PWD/mini-omni2:/home/mini-omni2 -v /opt/hyhal:/opt/hyhal:ro --privileged=true --device=/dev/kfd --device=/dev/dri/ --group-add video --name omni2 {imageID} bash
+cd /home/mini-omni2
+pip install -r requirements.txt # requirements.txt
+# 安装ffmpeg
+apt update
+apt-get install ffmpeg
+# 安装CLIP
+cd CLIP
+pip install . #clip==1.0
+```
diff --git a/enginex/var.md b/enginex/var.md
new file mode 100644
index 0000000..30db6b7
--- /dev/null
+++ b/enginex/var.md
@@ -0,0 +1,13 @@
+# 运行方式
+
+```bash
+docker pull git.modelhub.org.cn:9443/enginex-hygon/pytorch:2.1.0-ubuntu20.04-dtk24.04.1-py3.10
+docker run -it --network=host --privileged=true --name=var --device=/dev/kfd --device=/dev/dri --group-add video --shm-size=32G --cap-add=SYS_PTRACE --security-opt seccomp=unconfined -v /path/your_code_data/:/path/your_code_data/ -v /opt/hyhal/:/opt/hyhal/:ro {imageID} /bin/bash # 将 {imageID} 替换为以上拉取的docker镜像的ID
+
+cd /your_code_path/VAR
+pip config set global.index-url https://pypi.tuna.tsinghua.edu.cn/simple
+pip install -r requirements.txt
+wget https://download.sourcefind.cn:65024/directlink/4/flash_attn/DAS1.1/flash_attn-2.0.4+das1.1gitc7a8c18.abi1.dtk2404.torch2.1-cp310-cp310-manylinux_2_31_x86_64.whl
+pip install flash_attn-2.0.4+das1.1gitc7a8c18.abi1.dtk2404.torch2.1-cp310-cp310-manylinux_2_31_x86_64.whl
+git config --global --add safe.directory /your_code_path/VAR
+```