From 11e710dd3f8967a5e3b79b59028b1a0e065b5fe9 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 22 Jun 2026 03:07:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: xiaowangge/minicpm4-8b-gguf Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++++ README.md | 98 +++++++++++++++++++++++++++++++++++++++++ configuration.json | 1 + minicpm4-8b-fp16.gguf | 3 ++ minicpm4-8b-q4_K_M.gguf | 3 ++ minicpm4-8b-q8_0.gguf | 3 ++ 6 files changed, 155 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 configuration.json create mode 100644 minicpm4-8b-fp16.gguf create mode 100644 minicpm4-8b-q4_K_M.gguf create mode 100644 minicpm4-8b-q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..53d7257 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs 
merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..21dcf71 --- /dev/null +++ b/README.md @@ -0,0 +1,98 @@ +--- +frameworks: +- Pytorch +license: Apache License 2.0 +tasks: +- text-generation + +#model-type: +##如 gpt、phi、llama、chatglm、baichuan 等 +#- gpt + +#domain: +##如 nlp、cv、audio、multi-modal +#- nlp + +#language: +##语言代码列表 https://help.aliyun.com/document_detail/215387.html?spm=a2c4g.11186623.0.0.9f8d7467kni6Aa +#- cn + +#metrics: +##如 CIDEr、Blue、ROUGE 等 +#- CIDEr + +#tags: +##各种自定义,包括 pretrained、fine-tuned、instruction-tuned、RL-tuned 等训练方法和其他 +#- pretrained + +#tools: +##如 vllm、fastchat、llamacpp、AdaSeq 等 +#- vllm +language: + - zh + - en +base_model: + - OpenBMB/MiniCPM4-8B +base_model_relation: quantized +--- + + +### 介绍 + +1. 
该模型基于 `https://www.modelscope.cn/models/OpenBMB/MiniCPM4-8B` 转换。 +2. 开源许可遵循 `MiniCPM4-8B`。 + +### 模型下载 + +#### SDK 下载 + +```bash +# 安装 ModelScope +pip install modelscope +``` +```python +# SDK模型下载 +from modelscope import snapshot_download +model_dir = snapshot_download('xiaowangge/minicpm4-8b-gguf') +``` +#### Git 下载 + +``` +# Git模型下载 +git clone https://www.modelscope.cn/xiaowangge/minicpm4-8b-gguf.git +``` + +### 快速开始 + +> 本地构建或下载预构建形式的 `llama.cpp` 文件,使用 `llama-cli` 推理。 + +#### 源码构建 llama-cli +```bash +# 克隆 llama.cpp 源码 +git clone https://github.com/ggml-org/llama.cpp +# 进入目录 +cd llama.cpp +# 构建配置,开启 CUDA 加速,禁用 CURL +cmake -B build -DGGML_CUDA=ON -DLLAMA_CURL=OFF +# 多任务加速构建 +cmake --build build --config Release -j 10 +# 测试 +build/bin/llama-cli -h +``` + +#### llama-cli 推理 + +```bash +# GPU 加速 +build/bin/llama-cli -m ./minicpm4-8b-fp16.gguf -c 1024 -ngl 128 -n 512 -p "介绍下你自己" +``` + +#### ollama 推理 + +> 如果不想进行复杂的 `llama.cpp` 编译或配置,可使用 `ollama(version>=0.9.2)` 快速推理。 + +```bash +ollama run xiaowangge/minicpm4 +``` + + diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..f9291c3 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework":"Pytorch","task":"text-generation"} \ No newline at end of file diff --git a/minicpm4-8b-fp16.gguf b/minicpm4-8b-fp16.gguf new file mode 100644 index 0000000..0b0248c --- /dev/null +++ b/minicpm4-8b-fp16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe621d49d5cc5cee17043f5c96e93c00bd1c596f4ee140fe3baeb8366cc00d0 +size 16372735296 diff --git a/minicpm4-8b-q4_K_M.gguf b/minicpm4-8b-q4_K_M.gguf new file mode 100644 index 0000000..b0e42d3 --- /dev/null +++ b/minicpm4-8b-q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb5f071bf493b73029cbf190344cec01a599fafcc22e80de6361c396ddac07b +size 4965526080 diff --git a/minicpm4-8b-q8_0.gguf b/minicpm4-8b-q8_0.gguf new file mode 100644 index 0000000..affca64 --- /dev/null +++ 
b/minicpm4-8b-q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54bc78f66953d50e0c1a18bab8db71a283ebd7e366178f79d415388990a8adcc +size 8699309376