commit 35a138af6b92ed9b157a8dffe89929a8351578d9 Author: ModelHub XC Date: Sat Jun 6 00:56:19 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Monika-24B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..dd739c2 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,59 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Monika-24B.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Monika-24B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Monika-24B.i1-IQ1_M.gguf b/Monika-24B.i1-IQ1_M.gguf new file mode 100644 index 0000000..f74376b --- /dev/null +++ b/Monika-24B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0544b8f312afe485cfc5d2b20a878ff118a9a4191f7674609c8d802fd863804 +size 5750502784 diff --git a/Monika-24B.i1-IQ1_S.gguf b/Monika-24B.i1-IQ1_S.gguf new file mode 100644 index 0000000..b09e8c0 --- /dev/null +++ b/Monika-24B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3ab7bbc5c41952ac165f4c7811e32e58c597a29a0f7f5c01892582f4fdd5fa1 +size 5273728384 diff --git a/Monika-24B.i1-IQ2_M.gguf b/Monika-24B.i1-IQ2_M.gguf new file mode 100644 index 0000000..862fa93 --- /dev/null +++ b/Monika-24B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2fb5c6f64e989ef57ffd5c77395a24c94e9622c05f5c5328a8e5b67406c7eed +size 8114059136 diff --git a/Monika-24B.i1-IQ2_S.gguf b/Monika-24B.i1-IQ2_S.gguf new file mode 100644 index 0000000..8fdcea2 --- /dev/null +++ b/Monika-24B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954cfd21b84d7e91c150ad0aece1d59f45e81bc795f90c4ce8ee6de529dfa125 +size 7478359936 diff --git a/Monika-24B.i1-IQ2_XS.gguf b/Monika-24B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..549a411 --- /dev/null +++ b/Monika-24B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60fd26139bf8a6a14bec29e947ddddbeca9d3ce94a574822f96e4514379ecdc4 +size 7207040384 diff --git a/Monika-24B.i1-IQ2_XXS.gguf b/Monika-24B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..83351c2 --- /dev/null +++ b/Monika-24B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36c6b0cebdd06ea215c8decd5d689c242230528df8afff840d4f69195acb85a +size 6545126784 diff --git a/Monika-24B.i1-IQ3_M.gguf b/Monika-24B.i1-IQ3_M.gguf new file mode 100644 index 0000000..947831b --- /dev/null +++ b/Monika-24B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d550ba3228b6ad6c6dbd0fcbbf3f8f7ccbddb5dcce6fb6faea94af97111ae12 +size 10650958400 diff --git a/Monika-24B.i1-IQ3_S.gguf b/Monika-24B.i1-IQ3_S.gguf new file mode 100644 index 0000000..42db312 --- /dev/null +++ b/Monika-24B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5909b40970d546a33581f8398bd5c84ea83f41023d31fecbdff561dfc3ceb9b7 +size 10428136000 diff --git a/Monika-24B.i1-IQ3_XS.gguf b/Monika-24B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..a1728ce --- /dev/null +++ b/Monika-24B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e537fcdb87410ae6accf6ebb3f2a7f1527b3072528125f929c6b0ba544ecac +size 9907124800 diff --git a/Monika-24B.i1-IQ3_XXS.gguf b/Monika-24B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..5816903 --- /dev/null +++ b/Monika-24B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152d98559d2a3f8493a66bc9eed525d576594b8fb1c309f52c724731823db837 +size 9280599936 diff --git a/Monika-24B.i1-IQ4_XS.gguf b/Monika-24B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..1030195 --- /dev/null +++ b/Monika-24B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24ef252e86a08b4e3acfee2e4376c840d45cab53446fb3998f6486b28ea96f3 +size 12758924352 diff --git a/Monika-24B.i1-Q2_K.gguf b/Monika-24B.i1-Q2_K.gguf new file mode 100644 index 0000000..0f98eaa --- /dev/null +++ b/Monika-24B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebe84f21137072bdc23167838df9269aa27f37cadb89afdcfc767ed68724f96 +size 8890333248 diff --git a/Monika-24B.i1-Q2_K_S.gguf b/Monika-24B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..de9512e --- /dev/null +++ b/Monika-24B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8486f76d0bdfff55412b99914da5d846a90ed8a4bc4dfb9d5c58e75f6e09b9e3 +size 8320170048 diff --git a/Monika-24B.i1-Q3_K_L.gguf b/Monika-24B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..473ad52 --- /dev/null +++ b/Monika-24B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e925bce55d392df1cbaac2199895339b55654b2c3eaea433d567de68025891 +size 12400769600 diff --git a/Monika-24B.i1-Q3_K_M.gguf b/Monika-24B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a9b8a24 --- /dev/null +++ b/Monika-24B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b53d4cbd6132dcdcfc183909d588a517404c90cbf4e39b863abf61a26299a4 +size 11474090560 diff --git a/Monika-24B.i1-Q3_K_S.gguf b/Monika-24B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7b2814e --- /dev/null +++ b/Monika-24B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18288902286de373eef7dbc6a820ca0bb2348f8a6beb6fdfcd975206000d6760 +size 10400283200 diff --git a/Monika-24B.i1-Q4_0.gguf b/Monika-24B.i1-Q4_0.gguf new file mode 100644 index 0000000..80d0944 --- /dev/null +++ b/Monika-24B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5ce0261660d36c93a9efd0648cce016177b8ffcd18253943e98f94c40e6c0f +size 13494238432 diff --git a/Monika-24B.i1-Q4_1.gguf b/Monika-24B.i1-Q4_1.gguf new file mode 100644 index 0000000..c688076 --- /dev/null +++ b/Monika-24B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e303b580f9964352f169ad6710061495f4ca8f762aca348adad41cce50c5ac +size 14873116192 diff --git a/Monika-24B.i1-Q4_K_M.gguf b/Monika-24B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..f82bd19 --- /dev/null +++ b/Monika-24B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93ae22d064cbb22cf0abd82d3c5499bda50af44a3882b4236fc461b7d36e8fc +size 14333918432 diff --git a/Monika-24B.i1-Q4_K_S.gguf b/Monika-24B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..b91a686 --- /dev/null +++ b/Monika-24B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ef942ddd58c41c5a4159eaaf281b7bd8b92c36965810baeb57151b4710ca30 +size 13549288672 diff --git a/Monika-24B.i1-Q5_K_M.gguf b/Monika-24B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..2ecb0bb --- /dev/null +++ b/Monika-24B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b65f5060d12e431de53c05c625e9be6f3739ec2180c562d451b7197f4b057e2 +size 16763993952 diff --git a/Monika-24B.i1-Q5_K_S.gguf b/Monika-24B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..f89cb26 --- /dev/null +++ b/Monika-24B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37ae1511d1f7f66c3ecbee08311abd26064b68a44898f63d13a760589e5470e +size 16304422752 diff --git a/Monika-24B.i1-Q6_K.gguf b/Monika-24B.i1-Q6_K.gguf new file mode 100644 index 0000000..c260947 --- /dev/null +++ b/Monika-24B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2a046b73dd1fb4c69fd892f8023e13e82ff31edfc69e1ef35df54d1885848d +size 19345949216 diff --git a/Monika-24B.imatrix.gguf b/Monika-24B.imatrix.gguf new file mode 100644 index 0000000..8b6299e --- /dev/null +++ b/Monika-24B.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd7e67733e38b3bdbe5c359d7b91763ec4df0cc20d2a843a19c1b595f1f1316 +size 10037312 diff --git a/README.md b/README.md new file mode 100644 index 0000000..d011ae1 --- /dev/null +++ b/README.md @@ -0,0 +1,86 @@ +--- +base_model: Green-eyedDevil/Monika-24B +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- roleplay +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/Green-eyedDevil/Monika-24B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Monika-24B-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Monika-24B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ1_S.gguf) | i1-IQ1_S | 5.4 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ1_M.gguf) | i1-IQ1_M | 5.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 6.6 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 7.3 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ2_S.gguf) | i1-IQ2_S | 7.6 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ2_M.gguf) | i1-IQ2_M | 8.2 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 8.4 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q2_K.gguf) | i1-Q2_K | 9.0 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 9.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 10.0 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 10.5 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ3_S.gguf) | i1-IQ3_S | 10.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ3_M.gguf) | i1-IQ3_M | 10.8 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 11.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 12.5 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 12.9 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q4_0.gguf) | i1-Q4_0 | 13.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 13.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 14.4 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q4_1.gguf) | i1-Q4_1 | 15.0 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 16.4 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 16.9 | | +| [GGUF](https://huggingface.co/mradermacher/Monika-24B-i1-GGUF/resolve/main/Monika-24B.i1-Q6_K.gguf) | i1-Q6_K | 19.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +