From 3ce37d849a987e4b1237c85c73157a652ff20302 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 20 Apr 2026 03:32:05 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++ DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf | 3 + DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q2_K.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q4_0.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q4_1.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf | 3 + DialoGPT-small-Rick-Bot.i1-Q6_K.gguf | 3 + README.md | 84 +++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 219 insertions(+) create mode 100644 .gitattributes create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf create mode 100644 
DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q2_K.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q4_0.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q4_1.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf create mode 100644 DialoGPT-small-Rick-Bot.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..51cc4e8 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text 
+*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs 
-text +DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DialoGPT-small-Rick-Bot.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf b/DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf new file mode 100644 index 0000000..5b2d7ae --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a21aaead026c8d2979058a90f3d0889b8160f83e665e96c2f62bce3e0b9f96d +size 51057120 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf b/DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf new file mode 100644 index 0000000..1484ef9 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1bcf6c573f9c4be1063bec99fd68ba85b97589c9fa8511dde0c85ba1cfcaa8 +size 49287648 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf b/DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf new file mode 100644 index 0000000..3455e0d --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09c726abbc90891935f66ea8fbce5870e937e3c1401e3ae820d43d77244d32a +size 60180960 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf b/DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf new file mode 100644 index 0000000..f091117 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196cd8b23bd6f49e0da40e92e5ff88d6cebb74d76fa09cecbb3687b7519ec4bf +size 57821664 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf b/DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf new file mode 100644 index 0000000..b773f3b --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3e0112ffc0bbd33a855724a93efa251bf87dce56bbb5696e8b022d821fe03f +size 56586720 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf b/DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..df47ab7 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d338910e5ad61c83f09f58696f5ca55a59c15df0e690e71169fc613c6be4c02 +size 54006240 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf b/DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf new file mode 100644 index 0000000..7979369 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02bf9756c4baac8d6144fa4c58ab466cc6ea3838682e448ccbb4c7c735528030 +size 77638176 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf b/DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf new file mode 100644 index 0000000..53bd055 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5255afe82a72889f6c351a8e8cddafedf0a4c89e7a30e0df4c59a27979edf7 +size 73564704 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf b/DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf new file mode 100644 index 0000000..6c7a179 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4e02bdbe8d65a9e6b008941b7947c081c3a34e8255af0373ae0453b66a030e +size 72569376 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf b/DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf new file mode 100644 
index 0000000..c6f7a63 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1372e6cc1028baaf9db0722df4152723e3e36e8fe4c23973361fbee05575e1 +size 64788960 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf b/DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf new file mode 100644 index 0000000..5a9170d --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f357f027f4f00369e11bff52e2ff1a047b3d749f66cb8761b330c894521fd97a +size 84845088 diff --git a/DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf b/DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf new file mode 100644 index 0000000..1d49dce --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f18f6ce0a168e5a6263b5c30d481fd0fdea65048c7fd5408839d25f168ef07b +size 82190880 diff --git a/DialoGPT-small-Rick-Bot.i1-Q2_K.gguf b/DialoGPT-small-Rick-Bot.i1-Q2_K.gguf new file mode 100644 index 0000000..6a5ad7c --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0600d654ea257cf7eddd58e5b063509a0e27b38200e2d77a0a3108f0693d0af +size 68532768 diff --git a/DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf b/DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf new file mode 100644 index 0000000..01f6495 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad88f606076c568f2de144c9d182bc86017b3cf60335c8c19c451ce35854b74f +size 65491488 diff --git a/DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf b/DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf new file mode 100644 index 0000000..08825d3 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85532e3bc927b723ba34085fb56c5d631ace2349ba7109ce5f8884ffd29294a +size 85508640 diff --git 
a/DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf b/DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf new file mode 100644 index 0000000..886d6e7 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb650fba30049b706a84452ad0e626c18ca8e4590c5cb9e219a8c22cf38c3d7 +size 81084960 diff --git a/DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf b/DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf new file mode 100644 index 0000000..f8586dc --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61dd03821e39645eea464b9215cbf7c6e5c15b34553add34f34935b754c6713 +size 73564704 diff --git a/DialoGPT-small-Rick-Bot.i1-Q4_0.gguf b/DialoGPT-small-Rick-Bot.i1-Q4_0.gguf new file mode 100644 index 0000000..ed6cc87 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d0fef51874cbe4b721061330a3452c84b94988386d1e626677ea27ec55647e +size 84992544 diff --git a/DialoGPT-small-Rick-Bot.i1-Q4_1.gguf b/DialoGPT-small-Rick-Bot.i1-Q4_1.gguf new file mode 100644 index 0000000..2d0188e --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887f53cd792394167ed01882f7b689f01b62f971d7e62ac5963dc1914cc51cb2 +size 90153504 diff --git a/DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf b/DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf new file mode 100644 index 0000000..29c5a6a --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671b85b736210a54ef8fec625ef29fe1662af626219df0816ad8df4f0a9920d7 +size 91148832 diff --git a/DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf b/DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf new file mode 100644 index 0000000..5de0b6d --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:58711eee5d3256a0267cee88dc7e1c35c469b52ac5c1fcbbb290e87a9411628e +size 85140000 diff --git a/DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf b/DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf new file mode 100644 index 0000000..ebfeb43 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb1211057bdf4d89796b00cbb995ad3020a6da91dfcc2452fca40a6a9fef2d40 +size 100162080 diff --git a/DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf b/DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf new file mode 100644 index 0000000..3aa2826 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db46f903bef68f3434af13af6ed03a206a6ae990d56f9622e6ee4d67f873c29c +size 95461920 diff --git a/DialoGPT-small-Rick-Bot.i1-Q6_K.gguf b/DialoGPT-small-Rick-Bot.i1-Q6_K.gguf new file mode 100644 index 0000000..2027c80 --- /dev/null +++ b/DialoGPT-small-Rick-Bot.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb28b33944db3fec2c909a3c5f407c05a0ca9a225fee32962af15e290e0a3128 +size 106742304 diff --git a/README.md b/README.md new file mode 100644 index 0000000..908be5b --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: kingabzpro/DialoGPT-small-Rick-Bot +datasets: +- ysharma/rickandmorty +language: +- en +library_name: transformers +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- gpt-2 +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/kingabzpro/DialoGPT-small-Rick-Bot + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#DialoGPT-small-Rick-Bot-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, 
including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily by quality; IQ-quants are often preferable to similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ1_S.gguf) | i1-IQ1_S | 0.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ1_M.gguf) | i1-IQ1_M | 0.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ2_S.gguf) | i1-IQ2_S | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ2_M.gguf) | i1-IQ2_M | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.2 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q2_K.gguf) | i1-Q2_K | 0.2 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ3_S.gguf) | 
i1-IQ3_S | 0.2 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.2 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ3_M.gguf) | i1-IQ3_M | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q4_0.gguf) | i1-Q4_0 | 0.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q4_1.gguf) | i1-Q4_1 | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.2 | 
| +| [GGUF](https://huggingface.co/mradermacher/DialoGPT-small-Rick-Bot-i1-GGUF/resolve/main/DialoGPT-small-Rick-Bot.i1-Q6_K.gguf) | i1-Q6_K | 0.2 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..a75c54c --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33878cb1d263586b6b3005a879ada2d5dc0a280a9c0b80053f93fe1592c3579f +size 259687