From 36c9ae27691abe0747c77ef38a84d62562c80888 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 14 May 2026 10:20:37 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/InternVL3-2B-Instruct-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++ InternVL3-2B-Instruct.i1-IQ1_M.gguf | 3 + InternVL3-2B-Instruct.i1-IQ1_S.gguf | 3 + InternVL3-2B-Instruct.i1-IQ2_M.gguf | 3 + InternVL3-2B-Instruct.i1-IQ2_S.gguf | 3 + InternVL3-2B-Instruct.i1-IQ2_XS.gguf | 3 + InternVL3-2B-Instruct.i1-IQ2_XXS.gguf | 3 + InternVL3-2B-Instruct.i1-IQ3_M.gguf | 3 + InternVL3-2B-Instruct.i1-IQ3_S.gguf | 3 + InternVL3-2B-Instruct.i1-IQ3_XS.gguf | 3 + InternVL3-2B-Instruct.i1-IQ3_XXS.gguf | 3 + InternVL3-2B-Instruct.i1-IQ4_NL.gguf | 3 + InternVL3-2B-Instruct.i1-IQ4_XS.gguf | 3 + InternVL3-2B-Instruct.i1-Q2_K.gguf | 3 + InternVL3-2B-Instruct.i1-Q2_K_S.gguf | 3 + InternVL3-2B-Instruct.i1-Q3_K_L.gguf | 3 + InternVL3-2B-Instruct.i1-Q3_K_M.gguf | 3 + InternVL3-2B-Instruct.i1-Q3_K_S.gguf | 3 + InternVL3-2B-Instruct.i1-Q4_0.gguf | 3 + InternVL3-2B-Instruct.i1-Q4_1.gguf | 3 + InternVL3-2B-Instruct.i1-Q4_K_M.gguf | 3 + InternVL3-2B-Instruct.i1-Q4_K_S.gguf | 3 + InternVL3-2B-Instruct.i1-Q5_K_M.gguf | 3 + InternVL3-2B-Instruct.i1-Q5_K_S.gguf | 3 + InternVL3-2B-Instruct.i1-Q6_K.gguf | 3 + README.md | 88 +++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 223 insertions(+) create mode 100644 .gitattributes create mode 100644 InternVL3-2B-Instruct.i1-IQ1_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ1_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ2_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ2_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ2_XS.gguf create mode 100644 
InternVL3-2B-Instruct.i1-IQ2_XXS.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ3_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ3_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ3_XS.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ3_XXS.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ4_NL.gguf create mode 100644 InternVL3-2B-Instruct.i1-IQ4_XS.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q2_K.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q2_K_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q3_K_L.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q3_K_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q3_K_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q4_0.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q4_1.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q4_K_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q4_K_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q5_K_M.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q5_K_S.gguf create mode 100644 InternVL3-2B-Instruct.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..367b655 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet 
filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q3_K_M.gguf filter=lfs 
diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL3-2B-Instruct.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/InternVL3-2B-Instruct.i1-IQ1_M.gguf b/InternVL3-2B-Instruct.i1-IQ1_M.gguf new file mode 100644 index 0000000..92fdf92 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa1355f8a90fd8bb8c578337f80c021ee3a312a379b814c150c41a41fcad78a +size 540623136 diff --git a/InternVL3-2B-Instruct.i1-IQ1_S.gguf b/InternVL3-2B-Instruct.i1-IQ1_S.gguf new file mode 100644 index 0000000..123b29a --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80013d033f288aa3bd8bcbeca261163c7ecd7ea3c71f024accffade184a2555b +size 512689440 diff --git a/InternVL3-2B-Instruct.i1-IQ2_M.gguf b/InternVL3-2B-Instruct.i1-IQ2_M.gguf new file mode 100644 index 0000000..d756847 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf223edadf1ac4af1f008f8661a53cfdc30fd6fbbb96fc379fc83aa7517f376e +size 700877696 diff --git a/InternVL3-2B-Instruct.i1-IQ2_S.gguf b/InternVL3-2B-Instruct.i1-IQ2_S.gguf new file mode 100644 index 0000000..c47b0b7 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7bb0b60ea0243003c248578cc24e85c4f82a34a1e8b03bb4343b88e170a42f0 +size 663632768 diff --git 
a/InternVL3-2B-Instruct.i1-IQ2_XS.gguf b/InternVL3-2B-Instruct.i1-IQ2_XS.gguf new file mode 100644 index 0000000..4d0a70b --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c7f01f84646fb17b66cafdd2b4f072990437f809c1e05d19a0027af28cba4b +size 626488608 diff --git a/InternVL3-2B-Instruct.i1-IQ2_XXS.gguf b/InternVL3-2B-Instruct.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..136efcd --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ed15387e3a34c5ec60cecc322dbb3eda16599b6561e85c2dff230630f66496 +size 587179296 diff --git a/InternVL3-2B-Instruct.i1-IQ3_M.gguf b/InternVL3-2B-Instruct.i1-IQ3_M.gguf new file mode 100644 index 0000000..1ca74c6 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49eab93591a8c5bfdc476ae87f1cda18a0a7ee593dfabc8307832b1ad3b80dba +size 876433600 diff --git a/InternVL3-2B-Instruct.i1-IQ3_S.gguf b/InternVL3-2B-Instruct.i1-IQ3_S.gguf new file mode 100644 index 0000000..11fc9c1 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043bc053dc24e992b77ed49877f92c9cf7dc977ae9af719f58bcb25269c77adc +size 862176448 diff --git a/InternVL3-2B-Instruct.i1-IQ3_XS.gguf b/InternVL3-2B-Instruct.i1-IQ3_XS.gguf new file mode 100644 index 0000000..f81cc10 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a245a00bd113e014e755bd604dd4d5ac273652cb4d1bcbd7ad9539dc2cd256 +size 831468736 diff --git a/InternVL3-2B-Instruct.i1-IQ3_XXS.gguf b/InternVL3-2B-Instruct.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..d3eed52 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:ef4e14410a0b038190780b265ee5a4c0f0891d9c56a2e7a01893c20f36e2384a +size 768615296 diff --git a/InternVL3-2B-Instruct.i1-IQ4_NL.gguf b/InternVL3-2B-Instruct.i1-IQ4_NL.gguf new file mode 100644 index 0000000..cb90c4e --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88ef5e6cadcd131953b4adadc2d912c7f4337ca5947f919376799d2c7532746 +size 1067042272 diff --git a/InternVL3-2B-Instruct.i1-IQ4_XS.gguf b/InternVL3-2B-Instruct.i1-IQ4_XS.gguf new file mode 100644 index 0000000..5a5b8dd --- /dev/null +++ b/InternVL3-2B-Instruct.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6c6d16df58ec905eb4f704560649ea7c090bb77d4a5bcbd087c7ee2fd19e1a +size 1019162368 diff --git a/InternVL3-2B-Instruct.i1-Q2_K.gguf b/InternVL3-2B-Instruct.i1-Q2_K.gguf new file mode 100644 index 0000000..2fc6eec --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f05c7cac1b4f91c77d09f666485bc59aca09d0947641770fcb225b7f22a68a +size 752413280 diff --git a/InternVL3-2B-Instruct.i1-Q2_K_S.gguf b/InternVL3-2B-Instruct.i1-Q2_K_S.gguf new file mode 100644 index 0000000..dc403eb --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f1bd94ae80bb1d1e0d987aeefcf3ea343994053845a5bed5dbbbbe1ff31fa6 +size 716243552 diff --git a/InternVL3-2B-Instruct.i1-Q3_K_L.gguf b/InternVL3-2B-Instruct.i1-Q3_K_L.gguf new file mode 100644 index 0000000..42b4d38 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788e865b058d051d413eb8e6c4bcbb86e6fce47fdcfc0ecb0f6816381b6d43d0 +size 979932352 diff --git a/InternVL3-2B-Instruct.i1-Q3_K_M.gguf b/InternVL3-2B-Instruct.i1-Q3_K_M.gguf new file mode 100644 index 0000000..553c8e4 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q3_K_M.gguf @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e3794bff96ec37c741aab27b5f4787c082a0a6c9460c6932751a8fcd8bf037e +size 923948224 diff --git a/InternVL3-2B-Instruct.i1-Q3_K_S.gguf b/InternVL3-2B-Instruct.i1-Q3_K_S.gguf new file mode 100644 index 0000000..813345d --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762c868dc520d263591c93e52cacb49ec158ed75d9037f940867455069831e9f +size 860714176 diff --git a/InternVL3-2B-Instruct.i1-Q4_0.gguf b/InternVL3-2B-Instruct.i1-Q4_0.gguf new file mode 100644 index 0000000..d57013b --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ae8283f2c0f630a95cae7cc306e8631addb9ba0753dd5878fa1639ae50ce76 +size 1068246496 diff --git a/InternVL3-2B-Instruct.i1-Q4_1.gguf b/InternVL3-2B-Instruct.i1-Q4_1.gguf new file mode 100644 index 0000000..8f12e6d --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde15c1ad2bc9eb1f527166e031b35125860bbe2a750d9485cb6a13bde0af68d +size 1162113952 diff --git a/InternVL3-2B-Instruct.i1-Q4_K_M.gguf b/InternVL3-2B-Instruct.i1-Q4_K_M.gguf new file mode 100644 index 0000000..ba086be --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11594298914b42593161bf6b00649f59e21b8494ef4b3c2b45b0383e42780224 +size 1116759520 diff --git a/InternVL3-2B-Instruct.i1-Q4_K_S.gguf b/InternVL3-2B-Instruct.i1-Q4_K_S.gguf new file mode 100644 index 0000000..f145fd5 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddba0cdb6e27cbc1bdfba5d468ed87a9a6ca9069bc42e30cc5b6fb763e32dc15 +size 1071023584 diff --git a/InternVL3-2B-Instruct.i1-Q5_K_M.gguf b/InternVL3-2B-Instruct.i1-Q5_K_M.gguf new file mode 100644 index 0000000..2167844 --- /dev/null 
+++ b/InternVL3-2B-Instruct.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c484f507397c6b52d1a2900d6247f38176cf03b01b6243a1d00feff7966b60 +size 1284882784 diff --git a/InternVL3-2B-Instruct.i1-Q5_K_S.gguf b/InternVL3-2B-Instruct.i1-Q5_K_S.gguf new file mode 100644 index 0000000..ae5b16e --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c89fd496a1e068e856a4b9a6c1da6282045ee2cc852a61ec59d541ba468647 +size 1258561888 diff --git a/InternVL3-2B-Instruct.i1-Q6_K.gguf b/InternVL3-2B-Instruct.i1-Q6_K.gguf new file mode 100644 index 0000000..fbe82b5 --- /dev/null +++ b/InternVL3-2B-Instruct.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80857baafacab742ae51e7c719a98ae2d0b79f962e612602ed8ae4bfb4b09815 +size 1463513760 diff --git a/README.md b/README.md new file mode 100644 index 0000000..a1dc040 --- /dev/null +++ b/README.md @@ -0,0 +1,88 @@ +--- +base_model: OpenGVLab/InternVL3-2B-Instruct +language: +- multilingual +library_name: transformers +license: apache-2.0 +license_link: https://huggingface.co/Qwen/Qwen2.5-72B-Instruct/blob/main/LICENSE +license_name: qwen +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- internvl +- custom_code +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/OpenGVLab/InternVL3-2B-Instruct + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#InternVL3-2B-Instruct-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/InternVL3-2B-Instruct-GGUF + +**This is a vision model - mmproj files (if any) will be in the [static repository](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-GGUF).** +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for 
+more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ1_S.gguf) | i1-IQ1_S | 0.6 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ2_S.gguf) | i1-IQ2_S | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ2_M.gguf) | i1-IQ2_M | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.8 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q2_K.gguf) | i1-Q2_K | 0.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.0 | IQ3_XS 
probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ3_S.gguf) | i1-IQ3_S | 1.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ3_M.gguf) | i1-IQ3_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.1 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q4_0.gguf) | i1-Q4_0 | 1.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q4_1.gguf) | i1-Q4_1 | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.4 | | +| 
[GGUF](https://huggingface.co/mradermacher/InternVL3-2B-Instruct-i1-GGUF/resolve/main/InternVL3-2B-Instruct.i1-Q6_K.gguf) | i1-Q6_K | 1.6 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..8047290 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e18c4ac0e8bdd56527861cd08a5f5f9f5637044fc10e90686fbc4a07c8403828 +size 2042201