commit 7e69cbe39ded0ece9c9c5bd62fd1b87843891d2c Author: ModelHub XC Date: Sun May 10 04:36:04 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/InternVL2-1B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1e65baf --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs 
-text +InternVL2-1B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +InternVL2-1B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/InternVL2-1B.i1-IQ1_M.gguf b/InternVL2-1B.i1-IQ1_M.gguf new file mode 100644 index 0000000..e6fa107 --- /dev/null +++ b/InternVL2-1B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b4c6fc7c69e1be6eae2998290b3d6de6f0438e32da7b9cec9b775fb2e3d893 +size 394130784 diff --git a/InternVL2-1B.i1-IQ1_S.gguf b/InternVL2-1B.i1-IQ1_S.gguf new file mode 100644 index 0000000..09526f5 --- /dev/null +++ b/InternVL2-1B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:3411b2d73410b539b0e4e24017032c0bcd7905ff0762657b15e4f0d940b250c0 +size 391985760 diff --git a/InternVL2-1B.i1-IQ2_M.gguf b/InternVL2-1B.i1-IQ2_M.gguf new file mode 100644 index 0000000..366843d --- /dev/null +++ b/InternVL2-1B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8d000f7bcc733ce44d26d6a81dc2750ce3b6f5221c7378c648ca751b5d0212 +size 404753760 diff --git a/InternVL2-1B.i1-IQ2_S.gguf b/InternVL2-1B.i1-IQ2_S.gguf new file mode 100644 index 0000000..644a83a --- /dev/null +++ b/InternVL2-1B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f9593f4640b05e24dc707a8d2c78f6fd645e28b432ee1b69eff5c080632b53 +size 401893728 diff --git a/InternVL2-1B.i1-IQ2_XS.gguf b/InternVL2-1B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..17ec066 --- /dev/null +++ b/InternVL2-1B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c0817851efd821335d56b689a75843ab3a8139fcd8323f058037aa5e424d5f +size 400565856 diff --git a/InternVL2-1B.i1-IQ2_XXS.gguf b/InternVL2-1B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..ffb2148 --- /dev/null +++ b/InternVL2-1B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5197b6f5392e8298252eeab1a179917b41a2194ea5f4a2843ae22f215d92d996 +size 397705824 diff --git a/InternVL2-1B.i1-IQ3_M.gguf b/InternVL2-1B.i1-IQ3_M.gguf new file mode 100644 index 0000000..d740876 --- /dev/null +++ b/InternVL2-1B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75190f9288288cb0781c9214eac4e6d6edf2844d2419aaeb763cd9c72e11ce77 +size 418908768 diff --git a/InternVL2-1B.i1-IQ3_S.gguf b/InternVL2-1B.i1-IQ3_S.gguf new file mode 100644 index 0000000..4ee8ba7 --- /dev/null +++ b/InternVL2-1B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0083e1e574e7a445f44e6212783d3244db616e128afc147263484c3044d564c 
+size 414763872 diff --git a/InternVL2-1B.i1-IQ3_XS.gguf b/InternVL2-1B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..53f33b3 --- /dev/null +++ b/InternVL2-1B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac8d37e1ea7bf3da9669b04a0a7577d12b6770f6531168785365b3e7aff817e +size 414763872 diff --git a/InternVL2-1B.i1-IQ3_XXS.gguf b/InternVL2-1B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..1c0f08f --- /dev/null +++ b/InternVL2-1B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db02770e4f954988d8cd7bf39bc416a3117e68ac87be8ba24ff6e2fc8f6210e1 +size 409860960 diff --git a/InternVL2-1B.i1-IQ4_NL.gguf b/InternVL2-1B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..77af838 --- /dev/null +++ b/InternVL2-1B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb6800a811200e13722bab40b36c221a03b9a791564da984efc911af5b32049 +size 428827488 diff --git a/InternVL2-1B.i1-IQ4_XS.gguf b/InternVL2-1B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..c2b46af --- /dev/null +++ b/InternVL2-1B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3063c61c4da97bf2a0d74e5b7b8280dc5476109702fb1701c4c43d360655fd1 +size 425558880 diff --git a/InternVL2-1B.i1-Q2_K.gguf b/InternVL2-1B.i1-Q2_K.gguf new file mode 100644 index 0000000..49ad0d2 --- /dev/null +++ b/InternVL2-1B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968460a127f57854a475514cc554f24a7944c0f570bf677e6efbaa2d1b3280ea +size 414763872 diff --git a/InternVL2-1B.i1-Q2_K_S.gguf b/InternVL2-1B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..1ff04c9 --- /dev/null +++ b/InternVL2-1B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d5b737933e73533a9596234251c19cfc91b17c8d36fd94aac14c16317dda763 +size 407205216 diff --git a/InternVL2-1B.i1-Q3_K_L.gguf b/InternVL2-1B.i1-Q3_K_L.gguf new file mode 
100644 index 0000000..9d7ba39 --- /dev/null +++ b/InternVL2-1B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a40489c5da75fc69083c4f23d6ae290a8c42dfb7679aeb69409f528f408203e +size 445514592 diff --git a/InternVL2-1B.i1-Q3_K_M.gguf b/InternVL2-1B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a96db84 --- /dev/null +++ b/InternVL2-1B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e01ae0fddef0d56f6f052c13c7199ffcb393d5fdb765c84bf9fb502b8812080 +size 431623008 diff --git a/InternVL2-1B.i1-Q3_K_S.gguf b/InternVL2-1B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..d18c655 --- /dev/null +++ b/InternVL2-1B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa5c5b63fa349f99dfbfcb9140f51272883a325de0321ace788a17cec67906f +size 414419808 diff --git a/InternVL2-1B.i1-Q4_0.gguf b/InternVL2-1B.i1-Q4_0.gguf new file mode 100644 index 0000000..8ad82f4 --- /dev/null +++ b/InternVL2-1B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ac5d7f62f1e3b13518f86e2e36ebeb97c961ade08884dfe83f44a84a084305 +size 429128544 diff --git a/InternVL2-1B.i1-Q4_1.gguf b/InternVL2-1B.i1-Q4_1.gguf new file mode 100644 index 0000000..747e06d --- /dev/null +++ b/InternVL2-1B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ac0dcf199def568080f50969b72c8fc753acd4de82805601147d7631742bd6 +size 459168224 diff --git a/InternVL2-1B.i1-Q4_K_M.gguf b/InternVL2-1B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..8d6865b --- /dev/null +++ b/InternVL2-1B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389783fb33c3bf7a9acf7a8e9bb94e607bad4f89dbc2d3dd310735b327be596c +size 490949728 diff --git a/InternVL2-1B.i1-Q4_K_S.gguf b/InternVL2-1B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..c70d003 --- /dev/null +++ b/InternVL2-1B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:8482bea61a912d1fd3050572b31dd0efd1ccfeecd49a77d385f3504269e6a603 +size 478613600 diff --git a/InternVL2-1B.i1-Q5_K_M.gguf b/InternVL2-1B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..86434d4 --- /dev/null +++ b/InternVL2-1B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f6c3e00b749a93a5432392ebc34fbf089f14ef75323a3ddff65d05f7ce9cb3 +size 521720544 diff --git a/InternVL2-1B.i1-Q5_K_S.gguf b/InternVL2-1B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..2f90f4f --- /dev/null +++ b/InternVL2-1B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae957035745d81e52e18387a0f2fb475bc74b47ebb1af15dea25467183b531 +size 514344672 diff --git a/InternVL2-1B.i1-Q6_K.gguf b/InternVL2-1B.i1-Q6_K.gguf new file mode 100644 index 0000000..75dd682 --- /dev/null +++ b/InternVL2-1B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58adc733795f20db4745d12c4f52c280d1203686264944ce0f71e3c80ce2bdbc +size 649834400 diff --git a/README.md b/README.md new file mode 100644 index 0000000..d92ae39 --- /dev/null +++ b/README.md @@ -0,0 +1,86 @@ +--- +base_model: OpenGVLab/InternVL2-1B +language: +- multilingual +library_name: transformers +license: mit +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- internvl +- custom_code +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/OpenGVLab/InternVL2-1B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#InternVL2-1B-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/InternVL2-1B-GGUF + +**This is a vision model - mmproj files (if any) will be in the [static repository](https://huggingface.co/mradermacher/InternVL2-1B-GGUF).** +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.5 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.5 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.5 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ3_S.gguf) | i1-IQ3_S | 0.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q2_K.gguf) | i1-Q2_K | 
0.5 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ3_M.gguf) | i1-IQ3_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q4_0.gguf) | i1-Q4_0 | 0.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.5 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.5 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q4_1.gguf) | i1-Q4_1 | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/InternVL2-1B-i1-GGUF/resolve/main/InternVL2-1B.i1-Q6_K.gguf) | i1-Q6_K | 0.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: 
+https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..473f2e5 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37135decf31b9439ec0be10f2afa0af23e4cb9e29e0dfbbd89717fd8ccd2206a +size 988597