From a973f543c99faf3753502c6e4dfea1f5410d2236 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 12 Apr 2026 21:17:00 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/neo_7b-ortho-GGUF Source: Original Platform --- .gitattributes | 50 ++++++++++++++++++++++++++++++ README.md | 66 ++++++++++++++++++++++++++++++++++++++++ neo_7b-ortho.IQ3_M.gguf | 3 ++ neo_7b-ortho.IQ3_S.gguf | 3 ++ neo_7b-ortho.IQ3_XS.gguf | 3 ++ neo_7b-ortho.IQ4_XS.gguf | 3 ++ neo_7b-ortho.Q2_K.gguf | 3 ++ neo_7b-ortho.Q3_K_L.gguf | 3 ++ neo_7b-ortho.Q3_K_M.gguf | 3 ++ neo_7b-ortho.Q3_K_S.gguf | 3 ++ neo_7b-ortho.Q4_K_M.gguf | 3 ++ neo_7b-ortho.Q4_K_S.gguf | 3 ++ neo_7b-ortho.Q5_K_M.gguf | 3 ++ neo_7b-ortho.Q5_K_S.gguf | 3 ++ neo_7b-ortho.Q6_K.gguf | 3 ++ neo_7b-ortho.Q8_0.gguf | 3 ++ neo_7b-ortho.f16.gguf | 3 ++ 17 files changed, 161 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 neo_7b-ortho.IQ3_M.gguf create mode 100644 neo_7b-ortho.IQ3_S.gguf create mode 100644 neo_7b-ortho.IQ3_XS.gguf create mode 100644 neo_7b-ortho.IQ4_XS.gguf create mode 100644 neo_7b-ortho.Q2_K.gguf create mode 100644 neo_7b-ortho.Q3_K_L.gguf create mode 100644 neo_7b-ortho.Q3_K_M.gguf create mode 100644 neo_7b-ortho.Q3_K_S.gguf create mode 100644 neo_7b-ortho.Q4_K_M.gguf create mode 100644 neo_7b-ortho.Q4_K_S.gguf create mode 100644 neo_7b-ortho.Q5_K_M.gguf create mode 100644 neo_7b-ortho.Q5_K_S.gguf create mode 100644 neo_7b-ortho.Q6_K.gguf create mode 100644 neo_7b-ortho.Q8_0.gguf create mode 100644 neo_7b-ortho.f16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..ec4d9e4 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,50 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs 
diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.f16.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text 
+neo_7b-ortho.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +neo_7b-ortho.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..c3128c1 --- /dev/null +++ b/README.md @@ -0,0 +1,66 @@ +--- +base_model: DewEfresh/neo_7b-ortho +language: +- en +library_name: transformers +quantized_by: mradermacher +--- +## About + + + + + + +static quants of https://huggingface.co/DewEfresh/neo_7b-ortho + + +weighted/imatrix quants do not appear to be available (from me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q2_K.gguf) | Q2_K | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.IQ3_XS.gguf) | IQ3_XS | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.IQ3_S.gguf) | IQ3_S | 3.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q3_K_S.gguf) | Q3_K_S | 3.5 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.IQ3_M.gguf) | IQ3_M | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q3_K_M.gguf) | Q3_K_M | 3.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q3_K_L.gguf) | Q3_K_L | 4.2 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.IQ4_XS.gguf) | IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q4_K_S.gguf) | Q4_K_S | 4.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q4_K_M.gguf) | Q4_K_M | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q5_K_S.gguf) | Q5_K_S | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q5_K_M.gguf) | Q5_K_M | 5.6 | | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q6_K.gguf) | Q6_K | 6.5 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.Q8_0.gguf) | Q8_0 | 8.4 | fast, best quality | +| 
[GGUF](https://huggingface.co/mradermacher/neo_7b-ortho-GGUF/resolve/main/neo_7b-ortho.f16.gguf) | f16 | 15.7 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/neo_7b-ortho.IQ3_M.gguf b/neo_7b-ortho.IQ3_M.gguf new file mode 100644 index 0000000..2f951c7 --- /dev/null +++ b/neo_7b-ortho.IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd57a9b69cbcffa35eb742de7ee331455b08f443d8ef5fc55c98b50313fb8e2 +size 3528336960 diff --git a/neo_7b-ortho.IQ3_S.gguf b/neo_7b-ortho.IQ3_S.gguf new file mode 100644 index 0000000..850c956 --- /dev/null +++ b/neo_7b-ortho.IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adabc1109682ba3c961cabc12fe70252624e30fbefdd05c238a7d31fac515c2a +size 3428066880 diff --git a/neo_7b-ortho.IQ3_XS.gguf b/neo_7b-ortho.IQ3_XS.gguf new file mode 100644 index 0000000..ae72f14 --- /dev/null +++ b/neo_7b-ortho.IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86cd8326a4688fc39cf0b087719c81ee81ac55fe841d7b63fc800a8972cf49c6 +size 3254658624 diff --git a/neo_7b-ortho.IQ4_XS.gguf b/neo_7b-ortho.IQ4_XS.gguf new file mode 100644 index 0000000..3dd6417 --- /dev/null +++ b/neo_7b-ortho.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:140a66deb7c5d7471982d9396d67145558abc1b29debae92e0670ae117da7354 +size 4234939968 diff --git a/neo_7b-ortho.Q2_K.gguf b/neo_7b-ortho.Q2_K.gguf new file mode 100644 index 0000000..3271edd --- /dev/null +++ b/neo_7b-ortho.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331644815b9efda6e5fb03f20fc79e0341c050b4db9953a2a7b39f22b9cfe502 +size 2924953152 diff --git a/neo_7b-ortho.Q3_K_L.gguf b/neo_7b-ortho.Q3_K_L.gguf new file mode 100644 index 0000000..44d078d --- /dev/null +++ b/neo_7b-ortho.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf12a26af4291cd8c3cc47aece6a04a78253de072d65289fbe8b0c8b7dfc51f9 +size 4109313600 diff --git a/neo_7b-ortho.Q3_K_M.gguf b/neo_7b-ortho.Q3_K_M.gguf new file mode 100644 index 0000000..4469912 --- /dev/null +++ b/neo_7b-ortho.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6403dfb0741b7a34dac90657d87284433effdc132d66d843ead690eae5e3f9c +size 3790808640 diff --git a/neo_7b-ortho.Q3_K_S.gguf b/neo_7b-ortho.Q3_K_S.gguf new file mode 100644 index 0000000..cd453a0 --- /dev/null +++ b/neo_7b-ortho.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c156f9f6cae1ea739c009111d19d04f77d43ea5e9b390d27b2929979186eef9e +size 3428066880 diff --git a/neo_7b-ortho.Q4_K_M.gguf b/neo_7b-ortho.Q4_K_M.gguf new file mode 100644 index 0000000..cf401f9 --- /dev/null +++ b/neo_7b-ortho.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643b89a5472bbfe52f0ca2bc6d7e5cdf061d729750b059ab8cc7c33de4940354 +size 4743491136 diff --git a/neo_7b-ortho.Q4_K_S.gguf b/neo_7b-ortho.Q4_K_S.gguf new file mode 100644 index 0000000..2df6ccc --- /dev/null +++ b/neo_7b-ortho.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d08fee36d733efb0e04ce645dfd6cbf3d3fcd07fd338592667fdde842b3d9f6 +size 4469960256 diff --git a/neo_7b-ortho.Q5_K_M.gguf b/neo_7b-ortho.Q5_K_M.gguf new 
file mode 100644 index 0000000..3f52a52 --- /dev/null +++ b/neo_7b-ortho.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086487d50a8fab89ba365d971b3d6cbbcef45b5155e9045080f54e5af1469f49 +size 5544373824 diff --git a/neo_7b-ortho.Q5_K_S.gguf b/neo_7b-ortho.Q5_K_S.gguf new file mode 100644 index 0000000..5b295f2 --- /dev/null +++ b/neo_7b-ortho.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb795d55a4157a81f4de855f206056c849cb8e4d0a66a2bf1ef649e1d6a79042 +size 5386448448 diff --git a/neo_7b-ortho.Q6_K.gguf b/neo_7b-ortho.Q6_K.gguf new file mode 100644 index 0000000..64d09ca --- /dev/null +++ b/neo_7b-ortho.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13043b5fe51461953768d23ff7a2882aef7eb6e5c9d2a1b72fb5f4d4dcb18b33 +size 6395311680 diff --git a/neo_7b-ortho.Q8_0.gguf b/neo_7b-ortho.Q8_0.gguf new file mode 100644 index 0000000..b72da1c --- /dev/null +++ b/neo_7b-ortho.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76fdcf026db78d2f54aff163d6a43561a97bdb3f16fb2e4c4017e444a4c3d799 +size 8282809920 diff --git a/neo_7b-ortho.f16.gguf b/neo_7b-ortho.f16.gguf new file mode 100644 index 0000000..492f92d --- /dev/null +++ b/neo_7b-ortho.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c77b8c6de33823807b96b3cb7325a6a93ca254b25398a878ab1a50e5f1c87790 +size 15589254720