commit 4455c9e60c11ef63e1d1b241f451e94285462e8f Author: ModelHub XC Date: Wed May 20 07:53:37 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Deita-34b-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4fd2a04 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,57 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text 
+Deita-34b.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Deita-34b.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Deita-34b.i1-IQ1_M.gguf b/Deita-34b.i1-IQ1_M.gguf new file mode 100644 index 0000000..35220bb --- /dev/null +++ b/Deita-34b.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4a43e8934b3fb22069b16c6b276042e784833cfead4df7027af6781112077e +size 8176786208 diff --git a/Deita-34b.i1-IQ1_S.gguf b/Deita-34b.i1-IQ1_S.gguf new file mode 100644 index 0000000..a6ed54d --- /dev/null +++ b/Deita-34b.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fd80e8c1a2bec57a976b623d9c28ded16105996958181125a984ebe1ff24d2 +size 7498980128 diff --git a/Deita-34b.i1-IQ2_M.gguf b/Deita-34b.i1-IQ2_M.gguf new file mode 100644 index 0000000..478d4e9 --- /dev/null +++ b/Deita-34b.i1-IQ2_M.gguf @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f902a02e241332cda9af73fbd6a7ee448318aa2fd3a388e3aff87af7167ef38 +size 11794762528 diff --git a/Deita-34b.i1-IQ2_S.gguf b/Deita-34b.i1-IQ2_S.gguf new file mode 100644 index 0000000..4f2995f --- /dev/null +++ b/Deita-34b.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd59adf5d1419c102804f0336665295846d01353eabe595f98df7db8228de9bf +size 10891021088 diff --git a/Deita-34b.i1-IQ2_XS.gguf b/Deita-34b.i1-IQ2_XS.gguf new file mode 100644 index 0000000..9c99b58 --- /dev/null +++ b/Deita-34b.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8055016cebb32408cc3c2cc03dbbc60a2c6b2e0c06ea44f994133f50d44ebb +size 10306542368 diff --git a/Deita-34b.i1-IQ2_XXS.gguf b/Deita-34b.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..71b608b --- /dev/null +++ b/Deita-34b.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8fc40fef66aa5e80289d97569fbc7d14f401ed026e644e03eff11b88f08e289 +size 9306463008 diff --git a/Deita-34b.i1-IQ3_M.gguf b/Deita-34b.i1-IQ3_M.gguf new file mode 100644 index 0000000..2d5909f --- /dev/null +++ b/Deita-34b.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0220b463d9edcffb025c8ac98420fa40ef4bdc4d78431b7aab2855c046af748f +size 15564700448 diff --git a/Deita-34b.i1-IQ3_S.gguf b/Deita-34b.i1-IQ3_S.gguf new file mode 100644 index 0000000..0aee621 --- /dev/null +++ b/Deita-34b.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a657e08d8ee4a6d0cbb3751acaab193f272044a508a5255965a0582c1d24c291 +size 15018785568 diff --git a/Deita-34b.i1-IQ3_XS.gguf b/Deita-34b.i1-IQ3_XS.gguf new file mode 100644 index 0000000..ac8a8fa --- /dev/null +++ b/Deita-34b.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207b2b74bd8835f7a5d45f0f1d0c833b6c01222d9216053338c8aa2dd29cb2e1 +size 14234319648 
diff --git a/Deita-34b.i1-IQ3_XXS.gguf b/Deita-34b.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..86cde24 --- /dev/null +++ b/Deita-34b.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501433307e1714221a252d699067c5ff2be2176831b2f063cc4198373837b74c +size 13333875488 diff --git a/Deita-34b.i1-IQ4_XS.gguf b/Deita-34b.i1-IQ4_XS.gguf new file mode 100644 index 0000000..1d661f6 --- /dev/null +++ b/Deita-34b.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8c03d40ae61014d2c71c7093eb567eb8b31d2cfd8bc1309042649ed9f24956 +size 18475051808 diff --git a/Deita-34b.i1-Q2_K.gguf b/Deita-34b.i1-Q2_K.gguf new file mode 100644 index 0000000..ff79325 --- /dev/null +++ b/Deita-34b.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95470f55287a95579786772e3b3482456a4803ed870bdbac3f3a296888c63026 +size 12825234208 diff --git a/Deita-34b.i1-Q3_K_L.gguf b/Deita-34b.i1-Q3_K_L.gguf new file mode 100644 index 0000000..698718f --- /dev/null +++ b/Deita-34b.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90c38ea2499d86e3e39d3a117c3edd8e8758f0b642035c4022c4b130e100ce0 +size 18139446048 diff --git a/Deita-34b.i1-Q3_K_M.gguf b/Deita-34b.i1-Q3_K_M.gguf new file mode 100644 index 0000000..1ffb817 --- /dev/null +++ b/Deita-34b.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66479a7c1e93bcfdc981a1e997ed3e808b43b73473373062b47c3d7c11fb0c80 +size 16654924576 diff --git a/Deita-34b.i1-Q3_K_S.gguf b/Deita-34b.i1-Q3_K_S.gguf new file mode 100644 index 0000000..5a6afcf --- /dev/null +++ b/Deita-34b.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc7d785c24b60dc1b341d95d5fec15eb2223f647242a605c2309401a9588e62 +size 14960294688 diff --git a/Deita-34b.i1-Q4_0.gguf b/Deita-34b.i1-Q4_0.gguf new file mode 100644 index 0000000..7f19e92 --- /dev/null +++ b/Deita-34b.i1-Q4_0.gguf 
@@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83a1af3d1ce37b322d67e3ff15729d999c17f4e20100612a4365783c92786eff +size 19530754848 diff --git a/Deita-34b.i1-Q4_K_M.gguf b/Deita-34b.i1-Q4_K_M.gguf new file mode 100644 index 0000000..d28d950 --- /dev/null +++ b/Deita-34b.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e2ca62ea3503178c5fc03d7a63cd67615ce1a08845f8857c835e541f48cf0e +size 20658711328 diff --git a/Deita-34b.i1-Q4_K_S.gguf b/Deita-34b.i1-Q4_K_S.gguf new file mode 100644 index 0000000..9c5d394 --- /dev/null +++ b/Deita-34b.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab73d7b035480702da0b44b62d3167a57aa4264b14f67fce647f75674ed795c8 +size 19598650144 diff --git a/Deita-34b.i1-Q5_K_M.gguf b/Deita-34b.i1-Q5_K_M.gguf new file mode 100644 index 0000000..f6071d5 --- /dev/null +++ b/Deita-34b.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4204a71e3ef9cdad6d735cc7f96086b911e7259f47aeadac1bb17af7ac4eebeb +size 24321846048 diff --git a/Deita-34b.i1-Q5_K_S.gguf b/Deita-34b.i1-Q5_K_S.gguf new file mode 100644 index 0000000..8736dbc --- /dev/null +++ b/Deita-34b.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff58dc62cd033379007f4130162da26d2eb05437713f162159f496eb44ef83db +size 23707691808 diff --git a/Deita-34b.i1-Q6_K.gguf b/Deita-34b.i1-Q6_K.gguf new file mode 100644 index 0000000..0ea7648 --- /dev/null +++ b/Deita-34b.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12991e32ba22a381e1cc27ce13ea4a9ab6c3c394f228f9cb266c3de8920ae4f +size 28213926688 diff --git a/README.md b/README.md new file mode 100644 index 0000000..2398e93 --- /dev/null +++ b/README.md @@ -0,0 +1,74 @@ +--- +base_model: KnutJaegersberg/Deita-34b +datasets: +- KnutJaegersberg/Deita-6k +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher 
+--- +## About + + + + + +weighted/imatrix quants of https://huggingface.co/KnutJaegersberg/Deita-34b + + +static quants are available at https://huggingface.co/mradermacher/Deita-34b-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ1_S.gguf) | i1-IQ1_S | 7.6 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ1_M.gguf) | i1-IQ1_M | 8.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 9.4 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ2_XS.gguf) | i1-IQ2_XS | 10.4 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ2_S.gguf) | i1-IQ2_S | 11.0 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ2_M.gguf) | i1-IQ2_M | 11.9 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q2_K.gguf) | i1-Q2_K | 12.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 13.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ3_XS.gguf) | i1-IQ3_XS | 14.3 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q3_K_S.gguf) | i1-Q3_K_S | 15.1 | IQ3_XS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ3_S.gguf) | i1-IQ3_S | 15.1 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ3_M.gguf) | i1-IQ3_M | 15.7 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q3_K_M.gguf) | i1-Q3_K_M | 16.8 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q3_K_L.gguf) | i1-Q3_K_L | 18.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-IQ4_XS.gguf) | i1-IQ4_XS | 18.6 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q4_0.gguf) | i1-Q4_0 | 19.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q4_K_S.gguf) | i1-Q4_K_S | 19.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q4_K_M.gguf) | i1-Q4_K_M | 20.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q5_K_S.gguf) | i1-Q5_K_S | 23.8 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q5_K_M.gguf) | i1-Q5_K_M | 24.4 | | +| [GGUF](https://huggingface.co/mradermacher/Deita-34b-i1-GGUF/resolve/main/Deita-34b.i1-Q6_K.gguf) | i1-Q6_K | 28.3 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. 
+ +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..6fbf770 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cebfeffbc1cd772bcf85308763202792e8393e6a8b5410141f194b58c8ed17b +size 15251067