初始化项目,由ModelHub XC社区提供模型
Model: xiaowangge/minicpm4-8b-gguf Source: Original Platform
This commit is contained in:
47
.gitattributes
vendored
Normal file
47
.gitattributes
vendored
Normal file
@@ -0,0 +1,47 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
||||
*.tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.db* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ark* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ggml filter=lfs diff=lfs merge=lfs -text
|
||||
*.llamafile* filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
98
README.md
Normal file
98
README.md
Normal file
@@ -0,0 +1,98 @@
|
||||
---
|
||||
frameworks:
|
||||
- Pytorch
|
||||
license: Apache License 2.0
|
||||
tasks:
|
||||
- text-generation
|
||||
|
||||
#model-type:
|
||||
##如 gpt、phi、llama、chatglm、baichuan 等
|
||||
#- gpt
|
||||
|
||||
#domain:
|
||||
##如 nlp、cv、audio、multi-modal
|
||||
#- nlp
|
||||
|
||||
#language:
|
||||
##语言代码列表 https://help.aliyun.com/document_detail/215387.html?spm=a2c4g.11186623.0.0.9f8d7467kni6Aa
|
||||
#- cn
|
||||
|
||||
#metrics:
|
||||
##如 CIDEr、BLEU、ROUGE 等
|
||||
#- CIDEr
|
||||
|
||||
#tags:
|
||||
##各种自定义,包括 pretrained、fine-tuned、instruction-tuned、RL-tuned 等训练方法和其他
|
||||
#- pretrained
|
||||
|
||||
#tools:
|
||||
##如 vllm、fastchat、llamacpp、AdaSeq 等
|
||||
#- vllm
|
||||
language:
|
||||
- zh
|
||||
- en
|
||||
base_model:
|
||||
- OpenBMB/MiniCPM4-8B
|
||||
base_model_relation: quantized
|
||||
---
|
||||
|
||||
|
||||
### 介绍
|
||||
|
||||
1. 该模型基于 `https://www.modelscope.cn/models/OpenBMB/MiniCPM4-8B` 转换。
|
||||
2. 开源许可遵循 `MiniCPM4-8B`。
|
||||
|
||||
### 模型下载
|
||||
|
||||
#### SDK 下载
|
||||
|
||||
```bash
|
||||
# 安装 ModelScope
|
||||
pip install modelscope
|
||||
```
|
||||
```python
|
||||
# SDK模型下载
|
||||
from modelscope import snapshot_download
|
||||
model_dir = snapshot_download('xiaowangge/minicpm4-8b-gguf')
|
||||
```
|
||||
#### Git 下载
|
||||
|
||||
```bash
|
||||
# Git模型下载
|
||||
git clone https://www.modelscope.cn/xiaowangge/minicpm4-8b-gguf.git
|
||||
```
|
||||
|
||||
### 快速开始
|
||||
|
||||
> 本地构建或下载预构建形式的 `llama.cpp` 文件,使用 `llama-cli` 推理。
|
||||
|
||||
#### 源码构建 llama-cli
|
||||
```bash
|
||||
# 克隆 llama.cpp 源码
|
||||
git clone https://github.com/ggml-org/llama.cpp
|
||||
# 进入目录
|
||||
cd llama.cpp
|
||||
# 构建配置,开启 CUDA 加速,禁用 CURL
|
||||
cmake -B build -DGGML_CUDA=ON -DLLAMA_CURL=OFF
|
||||
# 多任务加速构建
|
||||
cmake --build build --config Release -j 10
|
||||
# 测试
|
||||
build/bin/llama-cli -h
|
||||
```
|
||||
|
||||
#### llama-cli 推理
|
||||
|
||||
```bash
|
||||
# GPU 加速
|
||||
build/bin/llama-cli -m ./minicpm4-8b-fp16.gguf -c 1024 -ngl 128 -n 512 -p "介绍下你自己"
|
||||
```
|
||||
|
||||
#### ollama 推理
|
||||
|
||||
> 如果不想进行复杂的 `llama.cpp` 编译或配置,可使用 `ollama`(版本 >= 0.9.2)快速推理。
|
||||
|
||||
```bash
|
||||
ollama run xiaowangge/minicpm4
|
||||
```
|
||||
|
||||
|
||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
||||
{"framework":"Pytorch","task":"text-generation"}
|
||||
3
minicpm4-8b-fp16.gguf
Normal file
3
minicpm4-8b-fp16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:cfe621d49d5cc5cee17043f5c96e93c00bd1c596f4ee140fe3baeb8366cc00d0
|
||||
size 16372735296
|
||||
3
minicpm4-8b-q4_K_M.gguf
Normal file
3
minicpm4-8b-q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ccb5f071bf493b73029cbf190344cec01a599fafcc22e80de6361c396ddac07b
|
||||
size 4965526080
|
||||
3
minicpm4-8b-q8_0.gguf
Normal file
3
minicpm4-8b-q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:54bc78f66953d50e0c1a18bab8db71a283ebd7e366178f79d415388990a8adcc
|
||||
size 8699309376
|
||||
Reference in New Issue
Block a user