From b160640347820dd8fa88dd9632dd8afa155d6ead Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 21 Apr 2026 22:11:39 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++ Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf | 3 + Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf | 3 + Falcon3-3B-Instruct-Heretic.imatrix.gguf | 3 + README.md | 99 +++++++++++++++++++++ 27 files changed, 234 insertions(+) create mode 100644 .gitattributes create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf create mode 100644 Falcon3-3B-Instruct-Heretic.imatrix.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..3bcbdce --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf new file mode 100644 index 0000000..9827898 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8496c2f0f0ee4265d40efdc7eab1030b364755d83b2ed5fb538fe5167a5ecc5 +size 965973120 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf new file mode 100644 index 0000000..476cb7c --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:345810d45006ee0282132c209aa26749aae3dc5e3889747eb82305ab9ce3e270 +size 917017728 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf new file mode 100644 index 0000000..c780145 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd414c75d969f860ff7776d21c8983106ec8dd482c5e7dc59c2fb7bcefcf3b0 +size 1267471488 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf new file mode 100644 index 0000000..151b0ee --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbf1c723ec5b6f7a262021cf976f6d45b8a7593c481bdae92a8bdbbcdf3c224 +size 1202197632 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf new file mode 100644 index 0000000..ce2edd0 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ec9fed38f6e533ee92ef1cf0ebcb921d2d35fe824451250ff2d7b2afc1887d +size 1119327360 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..b2ef3b2 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a6f04997e2c01a2714c91f76c3dda7c817a54eedc8e87be87532f51dca3737 +size 1047565440 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf new file mode 100644 index 0000000..ba090dd --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a94e7bf505e377dbafd0b1805f949fa7435cbdfde5023c0b2d7198e114b55fdf +size 1593693312 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf new file mode 100644 index 0000000..01d6b3d --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979314a53794e23ed450b08f8df961abdf319b66324ad64b4b24633e35407edc +size 1549407360 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf new file mode 100644 index 0000000..c03da96 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38480b2a867dcf2d81a77035b4252a296be08e858f8eea26f01c56aaa4721753 +size 1491309696 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..71a6628 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86bcb95d2a8a9f7820b6b4c58f134f90b8876eaf6194cdd1eab51b681f0e1a44 +size 1374819456 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf new file mode 100644 index 0000000..d4be77d --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ef6eaf13799f9058259f0cbc1746b0855cee1017802517423656d55fab404a +size 1924584576 diff --git a/Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf b/Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf new file mode 100644 index 0000000..2371ee2 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a317fca9eb7a755dacd810e31c4868d524bf6f5ea66a86138413ed7ffa4b211 +size 1836307584 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf new file mode 100644 index 0000000..093d918 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea62a7e8e60e2d3c2122f15540a7282beedc4df28422bf1020c08327e9135348 +size 1353880704 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf new file mode 100644 index 0000000..10f9ebe --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38f5f7c34b14b79313817234ea52d58fdda84d225f7f5b0f838455b3fd16e7d +size 1275778176 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf new file mode 100644 index 0000000..ee8b2c3 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dec14838ea793899020ac3aedbdbe54cbea1edced570d6feae76d844b1b9727 +size 1781355648 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf new file mode 100644 index 0000000..2521de1 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c643e803ac502d739e4525190f1f938596cc1c82bac81799afcae309b5da3e +size 1673221248 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7af283e --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:759d51ea37033546d30864a6048f3e205a91af812cbe0f43f493cf8bbf2d6cb7 +size 1549407360 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf new file mode 100644 index 0000000..49a0f8e --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d28d0a5deec2f8c4529c3d9d77088f0d4f4afdedbd02ec0c263465795ea8abc3 +size 1928123520 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf new file mode 100644 index 0000000..e1d59cc --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67560c900ce6d3d7471a8442dd729232a1e19d7fc971412aaba314d5c68aa51 +size 2101138560 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf new file mode 100644 index 0000000..16b9e7b --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1f2a89e9dac48e2f64aae8280b246ccd19528409a634c1128ab7b7fb8a51bf +size 2005685376 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf new file mode 100644 index 0000000..ba65bf4 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20573ffb2de4267f1660979de2e84c8c59cede96236231badfdce547b2303756 +size 1933235328 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf new file mode 100644 index 0000000..fe20ec0 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2476010c84a57be4be5495f9d9bd45aa81fed64fa22e691801682f5668a36d3f +size 2319471744 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf new file mode 100644 index 0000000..fd57e41 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8975c298f488881ce70c189ccbb6f9c9517d4a4cfe55e798fada36bc383e4cea +size 2277692544 diff --git a/Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf b/Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf new file mode 100644 index 0000000..949bfe5 --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f29f7b97ea2b759ec20bf062b5bb78a94dedd93b7e74de004ca1a751a507138 +size 2652869760 diff --git a/Falcon3-3B-Instruct-Heretic.imatrix.gguf b/Falcon3-3B-Instruct-Heretic.imatrix.gguf new file mode 100644 index 0000000..caae95a --- /dev/null +++ b/Falcon3-3B-Instruct-Heretic.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d782b840d498dd970ad81be279f49025462528411988e89a33d4146438bf2eb +size 2456768 diff --git a/README.md b/README.md new file mode 100644 index 0000000..19e0a70 --- /dev/null +++ b/README.md @@ -0,0 +1,99 @@ +--- +base_model: ChiKoi7/Falcon3-3B-Instruct-Heretic +language: +- en +- fr +- es +- pt +library_name: transformers +license: other +license_link: https://falconllm.tii.ae/falcon-terms-and-conditions.html +license_name: falcon-llm-license +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- Falcon +- Falcon3 +- tiiuae +- 3b +- Instruct +- Heretic +- Uncensored +- Abliterated +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/ChiKoi7/Falcon3-3B-Instruct-Heretic + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Falcon3-3B-Instruct-Heretic-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ1_S.gguf) | i1-IQ1_S | 1.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ1_M.gguf) | i1-IQ1_M | 1.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ2_S.gguf) | i1-IQ2_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ2_M.gguf) | i1-IQ2_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.4 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q2_K.gguf) | i1-Q2_K | 1.5 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ3_S.gguf) | i1-IQ3_S | 1.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ3_M.gguf) | i1-IQ3_M | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.8 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.0 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q4_0.gguf) | i1-Q4_0 | 2.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q4_1.gguf) | i1-Q4_1 | 2.2 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Falcon3-3B-Instruct-Heretic-i1-GGUF/resolve/main/Falcon3-3B-Instruct-Heretic.i1-Q6_K.gguf) | i1-Q6_K | 2.8 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +