commit 82ae073a3fe78081690d7ae446c8808b2f995255 Author: ModelHub XC Date: Wed Jun 17 14:53:15 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/internlm2-math-7b-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2f5a587 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,57 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q2_K.gguf filter=lfs diff=lfs 
merge=lfs -text +internlm2-math-7b.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +internlm2-math-7b.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..a019724 --- /dev/null +++ b/README.md @@ -0,0 +1,76 @@ +--- +base_model: internlm/internlm2-math-7b +language: +- en +- zh +library_name: transformers +license: other +quantized_by: mradermacher +tags: +- math +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/internlm/internlm2-math-7b + + +static quants are available at https://huggingface.co/mradermacher/internlm2-math-7b-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ1_M.gguf) | i1-IQ1_M | 2.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q2_K.gguf) | i1-Q2_K | 3.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| 
[GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q4_0.gguf) | i1-Q4_0 | 4.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.6 | | +| [GGUF](https://huggingface.co/mradermacher/internlm2-math-7b-i1-GGUF/resolve/main/internlm2-math-7b.i1-Q6_K.gguf) | i1-Q6_K | 6.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model 
quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..16fda5e --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b36c751fe7552fff26dd936285275e964c021daab97b89482447fc1d577582 +size 4988157 diff --git a/internlm2-math-7b.i1-IQ1_M.gguf b/internlm2-math-7b.i1-IQ1_M.gguf new file mode 100644 index 0000000..31b9d94 --- /dev/null +++ b/internlm2-math-7b.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1ffee28e844bd0145be60004e8ff2e4541128b6045ebec1a3e6c91955c7212 +size 2007717600 diff --git a/internlm2-math-7b.i1-IQ1_S.gguf b/internlm2-math-7b.i1-IQ1_S.gguf new file mode 100644 index 0000000..2ada366 --- /dev/null +++ b/internlm2-math-7b.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1c64c80057ee4d5bdd4a587dca6e0de7cb792b66aefe06c66d26c6451fc90d +size 1865373408 diff --git a/internlm2-math-7b.i1-IQ2_M.gguf b/internlm2-math-7b.i1-IQ2_M.gguf new file mode 100644 index 0000000..0e7a5c7 --- /dev/null +++ b/internlm2-math-7b.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78195eb7e5cde9627cb99c30f17a4e5ebd3f6e5841ccf9f4b8074e0b011fdc67 +size 2779170528 diff --git a/internlm2-math-7b.i1-IQ2_S.gguf b/internlm2-math-7b.i1-IQ2_S.gguf new file mode 100644 index 0000000..c28d99a --- /dev/null +++ b/internlm2-math-7b.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3592184e89634d38ff9261f3146cde7dbbf0d362db9af5aff0ba757180ab1d01 +size 
2589378272 diff --git a/internlm2-math-7b.i1-IQ2_XS.gguf b/internlm2-math-7b.i1-IQ2_XS.gguf new file mode 100644 index 0000000..5cc2e31 --- /dev/null +++ b/internlm2-math-7b.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b1d1ec06411824147fe216e07d5de1d0920f6aef1ec7109eb2a97512e2133c +size 2451527392 diff --git a/internlm2-math-7b.i1-IQ2_XXS.gguf b/internlm2-math-7b.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..dbf5b7d --- /dev/null +++ b/internlm2-math-7b.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1018834c2a84e061b39a292998c3fb7bde85ddf403fdfd36991ab16177c7f97d +size 2244957920 diff --git a/internlm2-math-7b.i1-IQ3_M.gguf b/internlm2-math-7b.i1-IQ3_M.gguf new file mode 100644 index 0000000..722f8c5 --- /dev/null +++ b/internlm2-math-7b.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce121d01a1ffda62182cd54e38620318791b32eb8200b184d00ca67d468efa9b +size 3596285664 diff --git a/internlm2-math-7b.i1-IQ3_S.gguf b/internlm2-math-7b.i1-IQ3_S.gguf new file mode 100644 index 0000000..adbddef --- /dev/null +++ b/internlm2-math-7b.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a74defd15c0daa76d0140655cce11383bda5aeff945bb70387fc5016e2b71d +size 3493787360 diff --git a/internlm2-math-7b.i1-IQ3_XS.gguf b/internlm2-math-7b.i1-IQ3_XS.gguf new file mode 100644 index 0000000..9bd52e9 --- /dev/null +++ b/internlm2-math-7b.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c840dc20e0aca8d402f5953d04fed9d55a3b46fcf0d913215eed0fd9f61cffd +size 3330209504 diff --git a/internlm2-math-7b.i1-IQ3_XXS.gguf b/internlm2-math-7b.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..38f1d6c --- /dev/null +++ b/internlm2-math-7b.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454b4f4000106e558b888e0eafab8357def8a5185ecd6a45e19ca5dbaa3d7913 +size 
3105801952 diff --git a/internlm2-math-7b.i1-IQ4_XS.gguf b/internlm2-math-7b.i1-IQ4_XS.gguf new file mode 100644 index 0000000..628453c --- /dev/null +++ b/internlm2-math-7b.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4361d75a167832b462b3dbd4d1dd513b16d653e1ac20b0e4286b2721eeeddfef +size 4244268768 diff --git a/internlm2-math-7b.i1-Q2_K.gguf b/internlm2-math-7b.i1-Q2_K.gguf new file mode 100644 index 0000000..4866c54 --- /dev/null +++ b/internlm2-math-7b.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c384fab78b00669f76d8b6ad6f9cb2100cd81f9624db1ca0b49898d8f07510b +size 3005449952 diff --git a/internlm2-math-7b.i1-Q3_K_L.gguf b/internlm2-math-7b.i1-Q3_K_L.gguf new file mode 100644 index 0000000..04a46ef --- /dev/null +++ b/internlm2-math-7b.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83da9e29a07326bc56f7abbc6f73b50a2da3947e96ef69331139d563c83ec162 +size 4133418720 diff --git a/internlm2-math-7b.i1-Q3_K_M.gguf b/internlm2-math-7b.i1-Q3_K_M.gguf new file mode 100644 index 0000000..5e2c4a5 --- /dev/null +++ b/internlm2-math-7b.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b812e15978b7f4f5fc640999eefe8c66eb502c34833681aef51d1dab91483e6 +size 3830380256 diff --git a/internlm2-math-7b.i1-Q3_K_S.gguf b/internlm2-math-7b.i1-Q3_K_S.gguf new file mode 100644 index 0000000..21ddaa7 --- /dev/null +++ b/internlm2-math-7b.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9805c966ee7e360ce642f4c8b9a73ce0fd23f256f8d1fad4b7568b629c79f2 +size 3475961568 diff --git a/internlm2-math-7b.i1-Q4_0.gguf b/internlm2-math-7b.i1-Q4_0.gguf new file mode 100644 index 0000000..38c93b6 --- /dev/null +++ b/internlm2-math-7b.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:858f4729ecf198f8143e7217e953349371688f6d604ccafbddbe9079503f95b9 +size 4467926752 diff 
--git a/internlm2-math-7b.i1-Q4_K_M.gguf b/internlm2-math-7b.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a90c408 --- /dev/null +++ b/internlm2-math-7b.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef585157493715401a42b2ee05c76f211fbf8b65ac1493c692f54fc2dc8a4489 +size 4712769248 diff --git a/internlm2-math-7b.i1-Q4_K_S.gguf b/internlm2-math-7b.i1-Q4_K_S.gguf new file mode 100644 index 0000000..f8c08e4 --- /dev/null +++ b/internlm2-math-7b.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf5ffb7d6fa37c595bd932a5235086f72b2bd0b6869137fdc6bb0846978e5c7 +size 4484703968 diff --git a/internlm2-math-7b.i1-Q5_K_M.gguf b/internlm2-math-7b.i1-Q5_K_M.gguf new file mode 100644 index 0000000..90091ea --- /dev/null +++ b/internlm2-math-7b.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548d2317d266df438809b56542237d273a34a1a5b9ab9ef884aae0f9da127ec1 +size 5506737888 diff --git a/internlm2-math-7b.i1-Q5_K_S.gguf b/internlm2-math-7b.i1-Q5_K_S.gguf new file mode 100644 index 0000000..7062d3c --- /dev/null +++ b/internlm2-math-7b.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b3f425917c7429ded3736e658a6971b7c2d7748ad3fcde6a177a8ecbabef0a +size 5373044448 diff --git a/internlm2-math-7b.i1-Q6_K.gguf b/internlm2-math-7b.i1-Q6_K.gguf new file mode 100644 index 0000000..4ab7288 --- /dev/null +++ b/internlm2-math-7b.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d84497b8ef941edcf3dfce9a2aeccad810c21561d06345482115e66f4d5ee43d +size 6350329568