commit 6727feebaf50a6080e5c0aaab6ac34a50b3334de Author: ModelHub XC Date: Mon Apr 13 02:34:59 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Hermes-2-Pro-Mistral-7B-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..8d26f5c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,49 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text 
+Hermes-2-Pro-Mistral-7B.IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.f16.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Hermes-2-Pro-Mistral-7B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Hermes-2-Pro-Mistral-7B.IQ3_M.gguf b/Hermes-2-Pro-Mistral-7B.IQ3_M.gguf new file mode 100644 index 0000000..81223a1 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e7bd893c11f6f6ddf8b2bad7dfdb8102ce0d3ce5f4d80516d57378bda17675a +size 3285061664 diff --git a/Hermes-2-Pro-Mistral-7B.IQ3_S.gguf b/Hermes-2-Pro-Mistral-7B.IQ3_S.gguf new file mode 100644 index 0000000..7d2de78 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45d7c3f77ab5f18d9ae57afffd581160220ded4acf403cdf564bc3a1ac33054 +size 3182563360 diff --git a/Hermes-2-Pro-Mistral-7B.IQ3_XS.gguf b/Hermes-2-Pro-Mistral-7B.IQ3_XS.gguf new file mode 100644 index 0000000..67fbf34 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1970b65afc26b62d821e64ec26ca906925610b9d75e35aa5ef22efea423ce352 +size 3018985504 diff --git 
a/Hermes-2-Pro-Mistral-7B.IQ4_XS.gguf b/Hermes-2-Pro-Mistral-7B.IQ4_XS.gguf new file mode 100644 index 0000000..3872c44 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47c9f234620ee72ce0428aee5b00c7e5578c5d7996c3023afa1f571518319f2 +size 3944571936 diff --git a/Hermes-2-Pro-Mistral-7B.Q2_K.gguf b/Hermes-2-Pro-Mistral-7B.Q2_K.gguf new file mode 100644 index 0000000..f632783 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7507d1e0c68abf9fadf5a8cb3b13ff1dc767a4dc994d519919199cb99a06356 +size 2719398944 diff --git a/Hermes-2-Pro-Mistral-7B.Q3_K_L.gguf b/Hermes-2-Pro-Mistral-7B.Q3_K_L.gguf new file mode 100644 index 0000000..7dc5026 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:223c65651524cd6805a24ddbb20d66c8b060a1df16afc8ffb84e4f069e6572e7 +size 3822194720 diff --git a/Hermes-2-Pro-Mistral-7B.Q3_K_M.gguf b/Hermes-2-Pro-Mistral-7B.Q3_K_M.gguf new file mode 100644 index 0000000..d4f9621 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f96e716109a2ece0a8d115f7bdd00744df743b878ad756c5945600b130b58ba +size 3519156256 diff --git a/Hermes-2-Pro-Mistral-7B.Q3_K_S.gguf b/Hermes-2-Pro-Mistral-7B.Q3_K_S.gguf new file mode 100644 index 0000000..81e5bca --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b33d270d61b29eaf52523a2cf6bb177b37b76453151186e2c383e71770828ae +size 3164737568 diff --git a/Hermes-2-Pro-Mistral-7B.Q4_K_M.gguf b/Hermes-2-Pro-Mistral-7B.Q4_K_M.gguf new file mode 100644 index 0000000..7f59f1e --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:a6ad481aa7ab6a666e5201a4c2391f949973a89debe7159be470fa5229ba0a06 +size 4368626720 diff --git a/Hermes-2-Pro-Mistral-7B.Q4_K_S.gguf b/Hermes-2-Pro-Mistral-7B.Q4_K_S.gguf new file mode 100644 index 0000000..9a04997 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff01612f4d6c25162de664a94af87aac263075b8a09acf10a1d8c28e5572009d +size 4140561440 diff --git a/Hermes-2-Pro-Mistral-7B.Q5_K_M.gguf b/Hermes-2-Pro-Mistral-7B.Q5_K_M.gguf new file mode 100644 index 0000000..b5fd435 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5840832f148ffabc9022ae507b6aa86f71b5a8a568332179126e3611c61aa675 +size 5131613216 diff --git a/Hermes-2-Pro-Mistral-7B.Q5_K_S.gguf b/Hermes-2-Pro-Mistral-7B.Q5_K_S.gguf new file mode 100644 index 0000000..5d49873 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79cf331289f52b2b5d2d6305428eacbe506305f3edca4190260dc62b7a68bcd2 +size 4997919776 diff --git a/Hermes-2-Pro-Mistral-7B.Q6_K.gguf b/Hermes-2-Pro-Mistral-7B.Q6_K.gguf new file mode 100644 index 0000000..329ea7f --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5adb55721025f49b2fc5976b1277fc77e6ce304ff528ebc8c88d820e6efa64 +size 5942286368 diff --git a/Hermes-2-Pro-Mistral-7B.Q8_0.gguf b/Hermes-2-Pro-Mistral-7B.Q8_0.gguf new file mode 100644 index 0000000..d2fa783 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8ea37420005a2e00526f56caa2901994d5c0e7d2f0e9f0857ae8f3f4576784 +size 7696142368 diff --git a/Hermes-2-Pro-Mistral-7B.f16.gguf b/Hermes-2-Pro-Mistral-7B.f16.gguf new file mode 100644 index 0000000..0c30a47 --- /dev/null +++ b/Hermes-2-Pro-Mistral-7B.f16.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:090a81648436fbb4150a9bdf2677f2b0e8d1d0ee85a71b89c8b3df669fa114cd +size 14485262368 diff --git a/README.md b/README.md new file mode 100644 index 0000000..8df0ce8 --- /dev/null +++ b/README.md @@ -0,0 +1,81 @@ +--- +base_model: NousResearch/Hermes-2-Pro-Mistral-7B +datasets: +- teknium/OpenHermes-2.5 +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- Mistral +- instruct +- finetune +- chatml +- DPO +- RLHF +- gpt4 +- synthetic data +- distillation +- function calling +- json mode +--- +## About + + + + + + +static quants of https://huggingface.co/NousResearch/Hermes-2-Pro-Mistral-7B + + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable to similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q2_K.gguf) | Q2_K | 2.8 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.IQ3_XS.gguf) | IQ3_XS | 3.1 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q3_K_S.gguf) | Q3_K_S | 3.3 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.IQ3_S.gguf) | IQ3_S | 3.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.IQ3_M.gguf) | IQ3_M | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q3_K_M.gguf) | Q3_K_M | 3.6 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q3_K_L.gguf) | Q3_K_L | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.IQ4_XS.gguf) | IQ4_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q4_K_S.gguf) | Q4_K_S | 4.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q4_K_M.gguf) | Q4_K_M | 4.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q5_K_S.gguf) | Q5_K_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q5_K_M.gguf) | Q5_K_M | 5.2 | | +| 
[GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q6_K.gguf) | Q6_K | 6.0 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.Q8_0.gguf) | Q8_0 | 7.8 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/Hermes-2-Pro-Mistral-7B-GGUF/resolve/main/Hermes-2-Pro-Mistral-7B.f16.gguf) | f16 | 14.6 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +