commit 0c905b9ab7d0e4434d891412bd3c8df3998678e5 Author: ModelHub XC Date: Wed Jun 17 15:27:21 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/internlm2-math-base-7b-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b9a2f30 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,57 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-base-7b.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..a477af7 --- /dev/null +++ b/README.md @@ -0,0 +1,76 @@ +--- +base_model: internlm/internlm2-math-base-7b +language: +- en +- zh +library_name: transformers +license: other +quantized_by: mradermacher +tags: +- math +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/internlm/internlm2-math-base-7b + + +static quants are available at https://huggingface.co/mradermacher/internlm2-math-base-7b-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ1_M.gguf) | i1-IQ1_M | 2.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q2_K.gguf) | i1-Q2_K | 3.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q4_0.gguf) | i1-Q4_0 | 4.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.6 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-base-7b-i1-GGUF/resolve/main/internlm2-math-base-7b.i1-Q6_K.gguf) | i1-Q6_K | 6.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..7859023 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a71ca02e917705e28d20864190dd982a27e04341b69611e9e2dda1234a24bfe +size 4988157 diff --git a/internlm2-math-base-7b.i1-IQ1_M.gguf b/internlm2-math-base-7b.i1-IQ1_M.gguf new file mode 100644 index 0000000..8b3d11d --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96598a7dc8c04065842ba9e982cc07f6a6ff1fca6d68ff99b1b7bf5b9afec426 +size 2007717632 diff --git a/internlm2-math-base-7b.i1-IQ1_S.gguf b/internlm2-math-base-7b.i1-IQ1_S.gguf new file mode 100644 index 0000000..159ddf3 --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a653cf8a51a5dffa4acdec672b1ae2b0d7b9e44193a37d94988934994f024b84 +size 1865373440 diff --git a/internlm2-math-base-7b.i1-IQ2_M.gguf b/internlm2-math-base-7b.i1-IQ2_M.gguf new file mode 100644 index 0000000..1c9831b --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6cc0d0d7e3a6e672191d233bd27412ac69d6ca54fdb6720ca7e44849e5c9df0 +size 2779170560 diff --git a/internlm2-math-base-7b.i1-IQ2_S.gguf b/internlm2-math-base-7b.i1-IQ2_S.gguf new file mode 100644 index 0000000..f3fdc37 --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:247bfbf71be384dd15df11672e2d75b1930d5eaca76959fac294c6dcb109827d +size 2589378304 diff --git a/internlm2-math-base-7b.i1-IQ2_XS.gguf b/internlm2-math-base-7b.i1-IQ2_XS.gguf new file mode 100644 index 0000000..b58f4fb --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0710e8e73913f7b0dcc505918ba6adc9a73549a7b5009ced81716368a7204563 +size 2451527424 diff --git a/internlm2-math-base-7b.i1-IQ2_XXS.gguf b/internlm2-math-base-7b.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..9052715 --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11325f50a2924b81ea1f1662f4e73dd322c8b46833f2ac46d5b6c5d96d89222a +size 2244957952 diff --git a/internlm2-math-base-7b.i1-IQ3_M.gguf b/internlm2-math-base-7b.i1-IQ3_M.gguf new file mode 100644 index 0000000..7afe1cd --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b525231f0def66ffabd3392d7ae6984d25ea21c64f97e36d75bf49e45b1ef7c8 +size 3596285696 diff --git a/internlm2-math-base-7b.i1-IQ3_S.gguf b/internlm2-math-base-7b.i1-IQ3_S.gguf new file mode 100644 index 0000000..7070443 --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e42e2e3106c2b65d28d75bfff1e3a6df4083713ddce8eee776bacaac51193b2 +size 3493787392 diff --git a/internlm2-math-base-7b.i1-IQ3_XS.gguf b/internlm2-math-base-7b.i1-IQ3_XS.gguf new file mode 100644 index 0000000..160a4ec --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf88892ecd531c6d19de56de7118ac691740aa00ea613856ed4462554f234c7 +size 3330209536 diff --git a/internlm2-math-base-7b.i1-IQ3_XXS.gguf b/internlm2-math-base-7b.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..d786d37 --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5fe1066f6179d114ec0b8ef680518abfc66a7896a229bf9409f035228e66de +size 3105801984 diff --git a/internlm2-math-base-7b.i1-IQ4_XS.gguf b/internlm2-math-base-7b.i1-IQ4_XS.gguf new file mode 100644 index 0000000..760487c --- /dev/null +++ b/internlm2-math-base-7b.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fdd094e426641f0324e08db9683b7a9509f38e7dd65f11e6a89676fb8ec4620 +size 4244268800 diff --git a/internlm2-math-base-7b.i1-Q2_K.gguf b/internlm2-math-base-7b.i1-Q2_K.gguf new file mode 100644 index 0000000..273cd08 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44d6c4155b440e3ad5a58cd4bb7f7ce8e3a41173ded4da6fdf3388c37699faa +size 3005449984 diff --git a/internlm2-math-base-7b.i1-Q3_K_L.gguf b/internlm2-math-base-7b.i1-Q3_K_L.gguf new file mode 100644 index 0000000..e87b412 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01dc8854679375c4dfa18b089d550742c6772711a0674d61df0fbd4d15f344fb +size 4133418752 diff --git a/internlm2-math-base-7b.i1-Q3_K_M.gguf b/internlm2-math-base-7b.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a524347 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ed14381ad27fb73512859ca175255a45010770cee241707dd9b777e363051c +size 3830380288 diff --git a/internlm2-math-base-7b.i1-Q3_K_S.gguf b/internlm2-math-base-7b.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7f51af3 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5041341a04aabdebcf5ef503c005ad7a53ff3469a0b45f0d53eecb4e0cf041 +size 3475961600 diff --git a/internlm2-math-base-7b.i1-Q4_0.gguf b/internlm2-math-base-7b.i1-Q4_0.gguf new file mode 100644 index 0000000..2942660 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb2325f0d75ecc59580233a98ad5ef738c05825327f469e3c439d939d1c02b73 +size 4467926784 diff --git a/internlm2-math-base-7b.i1-Q4_K_M.gguf b/internlm2-math-base-7b.i1-Q4_K_M.gguf new file mode 100644 index 0000000..cd01d72 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd6f31a109950f2dcfa94ac7ec06b42d177aadd45334ab12d487009d6e710da +size 4712769280 diff --git a/internlm2-math-base-7b.i1-Q4_K_S.gguf b/internlm2-math-base-7b.i1-Q4_K_S.gguf new file mode 100644 index 0000000..d79ae80 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04b76fe012c4b453becd3a734e26a8fc2ad6c126e5551da26892d8e21d75bdc +size 4484704000 diff --git a/internlm2-math-base-7b.i1-Q5_K_M.gguf b/internlm2-math-base-7b.i1-Q5_K_M.gguf new file mode 100644 index 0000000..5578701 --- /dev/null +++ b/internlm2-math-base-7b.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72a105712b225d00a0705ba35a8bcad3051bf828eb3bdf41e8b5f67c411028fa +size 5506737920 diff --git a/internlm2-math-base-7b.i1-Q5_K_S.gguf b/internlm2-math-base-7b.i1-Q5_K_S.gguf new file mode 100644 index 0000000..88bb31f --- /dev/null +++ b/internlm2-math-base-7b.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc248a69c3172785be18b1e4c33638635f7a5b0e9843a52d564b5857878f5a3 +size 5373044480 diff --git a/internlm2-math-base-7b.i1-Q6_K.gguf b/internlm2-math-base-7b.i1-Q6_K.gguf new file mode 100644 index 0000000..30d276e --- /dev/null +++ b/internlm2-math-base-7b.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637c82da647ad6e60f82dc683f36c0e7f1dfe936a0026fd8dbe2e363270ea44e +size 6350329600