From 2dc4a4f205a06f7311a4ef801830bc0406c4db5b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 11 Apr 2026 15:10:00 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Intellecta-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++++ Intellecta.i1-IQ1_M.gguf | 3 ++ Intellecta.i1-IQ1_S.gguf | 3 ++ Intellecta.i1-IQ2_M.gguf | 3 ++ Intellecta.i1-IQ2_S.gguf | 3 ++ Intellecta.i1-IQ2_XS.gguf | 3 ++ Intellecta.i1-IQ2_XXS.gguf | 3 ++ Intellecta.i1-IQ3_M.gguf | 3 ++ Intellecta.i1-IQ3_S.gguf | 3 ++ Intellecta.i1-IQ3_XS.gguf | 3 ++ Intellecta.i1-IQ3_XXS.gguf | 3 ++ Intellecta.i1-IQ4_NL.gguf | 3 ++ Intellecta.i1-IQ4_XS.gguf | 3 ++ Intellecta.i1-Q2_K.gguf | 3 ++ Intellecta.i1-Q2_K_S.gguf | 3 ++ Intellecta.i1-Q3_K_L.gguf | 3 ++ Intellecta.i1-Q3_K_M.gguf | 3 ++ Intellecta.i1-Q3_K_S.gguf | 3 ++ Intellecta.i1-Q4_0.gguf | 3 ++ Intellecta.i1-Q4_1.gguf | 3 ++ Intellecta.i1-Q4_K_M.gguf | 3 ++ Intellecta.i1-Q4_K_S.gguf | 3 ++ Intellecta.i1-Q5_K_M.gguf | 3 ++ Intellecta.i1-Q5_K_S.gguf | 3 ++ Intellecta.i1-Q6_K.gguf | 3 ++ README.md | 85 ++++++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 220 insertions(+) create mode 100644 .gitattributes create mode 100644 Intellecta.i1-IQ1_M.gguf create mode 100644 Intellecta.i1-IQ1_S.gguf create mode 100644 Intellecta.i1-IQ2_M.gguf create mode 100644 Intellecta.i1-IQ2_S.gguf create mode 100644 Intellecta.i1-IQ2_XS.gguf create mode 100644 Intellecta.i1-IQ2_XXS.gguf create mode 100644 Intellecta.i1-IQ3_M.gguf create mode 100644 Intellecta.i1-IQ3_S.gguf create mode 100644 Intellecta.i1-IQ3_XS.gguf create mode 100644 Intellecta.i1-IQ3_XXS.gguf create mode 100644 Intellecta.i1-IQ4_NL.gguf create mode 100644 Intellecta.i1-IQ4_XS.gguf create mode 100644 
Intellecta.i1-Q2_K.gguf create mode 100644 Intellecta.i1-Q2_K_S.gguf create mode 100644 Intellecta.i1-Q3_K_L.gguf create mode 100644 Intellecta.i1-Q3_K_M.gguf create mode 100644 Intellecta.i1-Q3_K_S.gguf create mode 100644 Intellecta.i1-Q4_0.gguf create mode 100644 Intellecta.i1-Q4_1.gguf create mode 100644 Intellecta.i1-Q4_K_M.gguf create mode 100644 Intellecta.i1-Q4_K_S.gguf create mode 100644 Intellecta.i1-Q5_K_M.gguf create mode 100644 Intellecta.i1-Q5_K_S.gguf create mode 100644 Intellecta.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f95c026 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs 
-text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Intellecta.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Intellecta.i1-IQ1_M.gguf b/Intellecta.i1-IQ1_M.gguf new file mode 100644 index 0000000..6b490a3 --- /dev/null +++ b/Intellecta.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:ae58a3ff550dde46dd4e8dedc8adba0f37460eadcfa0ba45479b601212feb990 +size 413604000 diff --git a/Intellecta.i1-IQ1_S.gguf b/Intellecta.i1-IQ1_S.gguf new file mode 100644 index 0000000..d738117 --- /dev/null +++ b/Intellecta.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816130940de833c2f867e8f8c7e4c858c4f2b6c412671816d8f2f0cdd841dcba +size 393549984 diff --git a/Intellecta.i1-IQ2_M.gguf b/Intellecta.i1-IQ2_M.gguf new file mode 100644 index 0000000..24938b0 --- /dev/null +++ b/Intellecta.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d117ade93c7822384c8a5adab32c3d770bc6afc78d5f3a729e3bf57c10ec7b1 +size 515446944 diff --git a/Intellecta.i1-IQ2_S.gguf b/Intellecta.i1-IQ2_S.gguf new file mode 100644 index 0000000..0c831cb --- /dev/null +++ b/Intellecta.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c65dc51fa79156c516b5fbad50f7c501419eef1c81f0c176f5692676212fcad +size 488708256 diff --git a/Intellecta.i1-IQ2_XS.gguf b/Intellecta.i1-IQ2_XS.gguf new file mode 100644 index 0000000..3f3553a --- /dev/null +++ b/Intellecta.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:140780a1739e54e761a09951603cece7e2bddad9fc9862cc6588a8e2a48e419e +size 475863200 diff --git a/Intellecta.i1-IQ2_XXS.gguf b/Intellecta.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..d820055 --- /dev/null +++ b/Intellecta.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba99e963605c42dbfc25167788ccc3716c42d765f5cc8bd24198662af222ce6c +size 447027360 diff --git a/Intellecta.i1-IQ3_M.gguf b/Intellecta.i1-IQ3_M.gguf new file mode 100644 index 0000000..a21e43c --- /dev/null +++ b/Intellecta.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a4c3f8f5f3f663a90cb4f3a97eefb0efc129661f28230f0c7ecd1a556c458c +size 657287328 diff --git 
a/Intellecta.i1-IQ3_S.gguf b/Intellecta.i1-IQ3_S.gguf new file mode 100644 index 0000000..412f03d --- /dev/null +++ b/Intellecta.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1235b4f8a8e12d3f37c1c94d2ff3af708d2365eb523a4e29f96b26ce4186ec1c +size 643917984 diff --git a/Intellecta.i1-IQ3_XS.gguf b/Intellecta.i1-IQ3_XS.gguf new file mode 100644 index 0000000..b07eda6 --- /dev/null +++ b/Intellecta.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01929d2a33109e5557d8b052f92f9ed07f2a75c392c382f8b72964f37788b4f1 +size 621111456 diff --git a/Intellecta.i1-IQ3_XXS.gguf b/Intellecta.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..a7c5baa --- /dev/null +++ b/Intellecta.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a215acf49a9e252112897cdce363b47234f4ec0f56e98ddb01cc31d017417f2 +size 562108576 diff --git a/Intellecta.i1-IQ4_NL.gguf b/Intellecta.i1-IQ4_NL.gguf new file mode 100644 index 0000000..ad501e3 --- /dev/null +++ b/Intellecta.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d934edcd761cf6c0413894824547c5735d0fc19ff080bbeb1c3761c3264277e6 +size 773023904 diff --git a/Intellecta.i1-IQ4_XS.gguf b/Intellecta.i1-IQ4_XS.gguf new file mode 100644 index 0000000..3e12dd8 --- /dev/null +++ b/Intellecta.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ca8cc9df25369da49ddeb60d0c9799c6a6b22b32e384de640981595310bc80 +size 743139488 diff --git a/Intellecta.i1-Q2_K.gguf b/Intellecta.i1-Q2_K.gguf new file mode 100644 index 0000000..348f137 --- /dev/null +++ b/Intellecta.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9363996e3736d3b1b6dbd64414a608936d7bd06c48075408aa3f99e5cbf46943 +size 580872352 diff --git a/Intellecta.i1-Q2_K_S.gguf b/Intellecta.i1-Q2_K_S.gguf new file mode 100644 index 0000000..7d84519 --- /dev/null +++ b/Intellecta.i1-Q2_K_S.gguf 
@@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e09f3f4b299ad626d78446caebdcd075af89022e8614c7a0a2a5a15bcd1cbd4 +size 554657952 diff --git a/Intellecta.i1-Q3_K_L.gguf b/Intellecta.i1-Q3_K_L.gguf new file mode 100644 index 0000000..73b304b --- /dev/null +++ b/Intellecta.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520d72b34ffbee4d63da89449cd06e031d5abbf34def62bef35b5791d46c4c0c +size 732522656 diff --git a/Intellecta.i1-Q3_K_M.gguf b/Intellecta.i1-Q3_K_M.gguf new file mode 100644 index 0000000..9e7505b --- /dev/null +++ b/Intellecta.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4463768e9354f4ea5a4b2a321771d1c55bad176c1f4555a79803b49c1db0d9bc +size 690841760 diff --git a/Intellecta.i1-Q3_K_S.gguf b/Intellecta.i1-Q3_K_S.gguf new file mode 100644 index 0000000..f0542aa --- /dev/null +++ b/Intellecta.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4f003a8edfa06993e6112747cf34c038c170fdb7ed59535147849993c5525a +size 641689760 diff --git a/Intellecta.i1-Q4_0.gguf b/Intellecta.i1-Q4_0.gguf new file mode 100644 index 0000000..8cad093 --- /dev/null +++ b/Intellecta.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa9fda9b4fd22b32a08c70a96d66c5428a730b08a1268e0ff524b60d4ff6903 +size 773023904 diff --git a/Intellecta.i1-Q4_1.gguf b/Intellecta.i1-Q4_1.gguf new file mode 100644 index 0000000..4afcdbd --- /dev/null +++ b/Intellecta.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea742511a7e9992f6fefb7c54089a5ed80207bb9d1f457436b30a41e495b2e6 +size 831744160 diff --git a/Intellecta.i1-Q4_K_M.gguf b/Intellecta.i1-Q4_K_M.gguf new file mode 100644 index 0000000..44a0aa9 --- /dev/null +++ b/Intellecta.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f54cba13f377dbfeac3be77afb605e6e141530dbdf27a3206b8fac46a659b5 +size 
807692448 diff --git a/Intellecta.i1-Q4_K_S.gguf b/Intellecta.i1-Q4_K_S.gguf new file mode 100644 index 0000000..1c4f8f7 --- /dev/null +++ b/Intellecta.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12134c62dfb63c1cb901323931ceae11b1540fbeab1bf983793e056fe6316398 +size 775645344 diff --git a/Intellecta.i1-Q5_K_M.gguf b/Intellecta.i1-Q5_K_M.gguf new file mode 100644 index 0000000..937e0f7 --- /dev/null +++ b/Intellecta.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a9b957ca99bcb7dcac9e31af85b5cb41b2f395fdd725c2431287be1c8546297 +size 911501472 diff --git a/Intellecta.i1-Q5_K_S.gguf b/Intellecta.i1-Q5_K_S.gguf new file mode 100644 index 0000000..b8b81f5 --- /dev/null +++ b/Intellecta.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6247cb3739750dfc4e87bdd7f70a3fd381ee5613a3995d186f5317722f79439b +size 892561568 diff --git a/Intellecta.i1-Q6_K.gguf b/Intellecta.i1-Q6_K.gguf new file mode 100644 index 0000000..a68641f --- /dev/null +++ b/Intellecta.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73920dd088568b73c60157b665ccad899ad68c9809922431d20aa6d0c49eca37 +size 1021798560 diff --git a/README.md b/README.md new file mode 100644 index 0000000..c039dcf --- /dev/null +++ b/README.md @@ -0,0 +1,85 @@ +--- +base_model: kssrikar4/Intellecta +datasets: +- fka/awesome-chatgpt-prompts +- BAAI/Infinity-Instruct +- allenai/WildChat-1M +- lavita/ChatDoctor-HealthCareMagic-100k +- zjunlp/Mol-Instructions +- garage-bAInd/Open-Platypus +language: +- en +library_name: transformers +license: llama3.2 +quantized_by: mradermacher +tags: +- generated_from_trainer +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/kssrikar4/Intellecta + + +static quants are available at https://huggingface.co/mradermacher/Intellecta-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ1_M.gguf) | i1-IQ1_M | 0.5 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ2_S.gguf) | i1-IQ2_S | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ2_M.gguf) | i1-IQ2_M | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.7 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q2_K.gguf) | i1-Q2_K | 0.7 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.7 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ3_S.gguf) | i1-IQ3_S | 0.7 | beats Q3_K* | +| 
[GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ3_M.gguf) | i1-IQ3_M | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.8 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.8 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.9 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q4_0.gguf) | i1-Q4_0 | 0.9 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.9 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.9 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q4_1.gguf) | i1-Q4_1 | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Intellecta-i1-GGUF/resolve/main/Intellecta.i1-Q6_K.gguf) | i1-Q6_K | 1.1 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See 
https://huggingface.co/mradermacher/model_requests for answers to +questions you might have and/or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..a705888 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04835684d85caf5674662527d82579367f79aa11f08359bd275dc3fe9c2131fd +size 1314413