From 80cd1a3c5fac85a9e558245906c418b009350f7e Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 11 Apr 2026 03:16:58 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++ Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf | 3 + Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q2_K.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q4_0.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q4_1.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf | 3 + Phi4.React.Turn.V2.Full.i1-Q6_K.gguf | 3 + README.md | 84 +++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 219 insertions(+) create mode 100644 .gitattributes create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q2_K.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q4_0.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q4_1.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf create mode 100644 Phi4.React.Turn.V2.Full.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f4a6d6d --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf b/Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf new file mode 100644 index 0000000..50ff6b5 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00f96bd4902a82ffe798a2669c44e64295f17b3b5428367c8b83e2fdbb9d02e3 +size 3690189280 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf b/Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf new file mode 100644 index 0000000..64419e7 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16bb886f52221c74b1db7b3b438a2b5758adc4b2173bd65ab8ce414712da6164 +size 3412173280 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf b/Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf new file mode 100644 index 0000000..431a090 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b00537e86eaa999f773eb5a18d1d438585383367c09de861a4e11b80fc0e67e +size 5173924320 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf b/Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf new file mode 100644 index 0000000..11a2dda --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3671db2279b0e14680f304482c8cad4e27fa0afb75b1d00eec2807222e19c9cb +size 4803236320 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf b/Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf new file mode 100644 index 0000000..ff5e545 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffbdf09727196c3f230ee652d839689cdf5447ba18129fbafbf399d69dd60bc3 +size 4557005280 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf b/Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..214e10a --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c0336f04ced624e70617aae36c41ef856fe807b2645fc180382d3dd499c92b +size 4153549280 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf b/Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf new file mode 100644 index 0000000..6132ef3 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42543d3f6c18263af9f424243f4a1c6c238c9fe7902328e76c4f5e1b2654725 +size 6739763680 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf b/Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf new file mode 100644 index 0000000..cbce5f8 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee6b688f655ba9c22c3feb7a65655ef68a5cca9813e78f3f83e6b6c0952fcc6 +size 6539571680 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf b/Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf new file mode 100644 index 0000000..0f08088 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee5ed13b69a5d0f2cb4314c8350dd0d6a34081dba61a1b5caa7050a1c9e4a2f +size 6220083680 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf b/Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..4b786de --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8da498172e5a3c209030b17f6b9c2494e447e37ffb89b688c3b88037d28791a +size 5811876320 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf b/Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf new file mode 100644 index 0000000..60487b6 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903715efd3aead4800483f3010c8b877b4be60594f1cdcd485acf073f4e29e36 +size 8416195040 diff --git a/Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf b/Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf new file mode 100644 index 0000000..7208c1b --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad4689b959bba340a161f37050d79dba09505676a35925f53318d452bbda11c +size 7982346720 diff --git a/Phi4.React.Turn.V2.Full.i1-Q2_K.gguf b/Phi4.React.Turn.V2.Full.i1-Q2_K.gguf new file mode 100644 index 0000000..d232252 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506983bd7b2032b1f16f2f18ec6feb32eddba8a2279b28a79abdaae186d391ac +size 5608796640 diff --git a/Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf b/Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf new file mode 100644 index 0000000..4cc3710 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190a6d9a590899232a4c93faede7b160ab3fe310a59e5c68e1ec1498d5edcf5c +size 5237084640 diff --git a/Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf b/Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf new file mode 100644 index 0000000..7534d57 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f541ee50982a7ba10fcdfcd3a91aef04d420e82d3b3db0ef3572078e27dd87 +size 7788851680 diff --git a/Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf b/Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf new file mode 100644 index 0000000..79421dd --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe1be4061c192528da50bb0fc3a19ed5e0f18c7a997c46782a579cba33d6b04 +size 7190835680 diff --git a/Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf b/Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf new file mode 100644 index 0000000..ef28fac --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f990262f9d0d42127f8cfbeb2cfb4e4458ed53d0d3386fe052e3b1aa5942b36d +size 6504755680 diff --git a/Phi4.React.Turn.V2.Full.i1-Q4_0.gguf b/Phi4.React.Turn.V2.Full.i1-Q4_0.gguf new file mode 100644 index 0000000..69d0d15 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a493ef35166588be506b743172ecbabaf471520ee2e9f6269f11af1a706a4d +size 8412099040 diff --git a/Phi4.React.Turn.V2.Full.i1-Q4_1.gguf b/Phi4.React.Turn.V2.Full.i1-Q4_1.gguf new file mode 100644 index 0000000..774d1ce --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a7b292ea51875eea40a5699dcaf1a497bf60e3b3c57de1198dadad6f6d16c1e +size 9267507680 diff --git a/Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf b/Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf new file mode 100644 index 0000000..1f23ac2 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64126e0f48298248f07007a8d5145b6c19255d87cb0533dcc9afb71563d90475 +size 8890307040 diff --git a/Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf b/Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf new file mode 100644 index 0000000..cf3050d --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391c2af93c8ec4630c607fd41e25cd6e9a06c3156556eac74de9b5bbeeab95ba +size 8444047840 diff --git a/Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf b/Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf new file mode 100644 index 0000000..dbbfa03 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7399e1d371b77eeaddb4ce71e3650965eba81dd71e19163d555777287ec1986f +size 10412708320 diff --git a/Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf b/Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf new file mode 100644 index 0000000..aef2c8d --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c79b02532f45cddad4893720ed4bee625ab76ba458178ff80bb8307d9fc6770 +size 10151588320 diff --git a/Phi4.React.Turn.V2.Full.i1-Q6_K.gguf b/Phi4.React.Turn.V2.Full.i1-Q6_K.gguf new file mode 100644 index 0000000..eb84d90 --- /dev/null +++ b/Phi4.React.Turn.V2.Full.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391580b4e8ba1c25626fd1d7f4151c3b7738a5ed45fa3dca717936f3ca13591c +size 12030259680 diff --git a/README.md b/README.md new file mode 100644 index 0000000..c57cc49 --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: Quazim0t0/Phi4.React.Turn.V2.Full +datasets: +- cfahlgren1/react-code-instructions +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- llama +- gguf +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Quazim0t0/Phi4.React.Turn.V2.Full + + +static quants are available at https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ1_S.gguf) | i1-IQ1_S | 3.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ1_M.gguf) | i1-IQ1_M | 3.8 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ2_XS.gguf) | i1-IQ2_XS | 4.7 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ2_S.gguf) | i1-IQ2_S | 4.9 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ2_M.gguf) | i1-IQ2_M | 5.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q2_K_S.gguf) | i1-Q2_K_S | 5.3 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q2_K.gguf) | i1-Q2_K | 5.7 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 5.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ3_XS.gguf) | i1-IQ3_XS | 6.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q3_K_S.gguf) | i1-Q3_K_S | 6.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ3_S.gguf) | i1-IQ3_S | 6.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ3_M.gguf) | i1-IQ3_M | 6.8 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q3_K_M.gguf) | i1-Q3_K_M | 7.3 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q3_K_L.gguf) | i1-Q3_K_L | 7.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ4_XS.gguf) | i1-IQ4_XS | 8.1 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q4_0.gguf) | i1-Q4_0 | 8.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-IQ4_NL.gguf) | i1-IQ4_NL | 8.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q4_K_S.gguf) | i1-Q4_K_S | 8.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q4_K_M.gguf) | i1-Q4_K_M | 9.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q4_1.gguf) | i1-Q4_1 | 9.4 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q5_K_S.gguf) | i1-Q5_K_S | 10.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q5_K_M.gguf) | i1-Q5_K_M | 10.5 | | +| [GGUF](https://huggingface.co/mradermacher/Phi4.React.Turn.V2.Full-i1-GGUF/resolve/main/Phi4.React.Turn.V2.Full.i1-Q6_K.gguf) | i1-Q6_K | 12.1 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..fac59de --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077d2b899947b5be16c71974e853b39bb13c95b1e321c1e6787ee35192373506 +size 7791685