commit 113fb50b558ed12421b1d91fd04e1e2ecdd28f84 Author: ModelHub XC Date: Wed Jun 17 16:38:16 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: ibm-granite/granite-4.1-30b-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..c105ebd --- /dev/null +++ b/.gitattributes @@ -0,0 +1,54 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q8_0.gguf filter=lfs 
diff=lfs merge=lfs -text +granite-4.1-30b-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-bf16-00001-of-00005.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-bf16-00002-of-00005.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-bf16-00003-of-00005.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-bf16-00004-of-00005.gguf filter=lfs diff=lfs merge=lfs -text +granite-4.1-30b-bf16-00005-of-00005.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..5b0061e --- /dev/null +++ b/README.md @@ -0,0 +1,31 @@ +--- +pipeline_tag: text-generation +inference: false +license: apache-2.0 +library_name: transformers +tags: +- language +- granite-4.1 +- gguf +base_model: +- ibm-granite/granite-4.1-30b +--- + +> [!NOTE] +> This repository contains models that have been converted to the GGUF format with various quantizations from an IBM Granite `.safetensors` model. 
+> +> Please reference the base model's full model card here: +> https://huggingface.co/ibm-granite/granite-4.1-30b + +### Merging the `.bf16` model + +The `bf16` model had to be split into multiple files to accommodate single-file size restrictions. The split was performed +with the `llama-gguf-split` tool (using its default `--split` settings), which can be built from the [ggml-org/llama.cpp](https://github.com/ggml-org/llama.cpp) project. + +Use the following command, which points to the first file in the sequence, to merge the split files: + +```bash +llama-gguf-split --merge granite-4.1-30b-bf16-00001-of-00005.gguf granite-4.1-30b-bf16.gguf +``` + +The remaining split filenames are inferred by the tool based upon the `00001-of-0000x` naming convention. diff --git a/granite-4.1-30b-Q2_K.gguf b/granite-4.1-30b-Q2_K.gguf new file mode 100644 index 0000000..dbc8b4f --- /dev/null +++ b/granite-4.1-30b-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fca9861ca64ad59630abe131699403fbc8b4710f998c1be4b3ef99c9cc101c +size 10723779808 diff --git a/granite-4.1-30b-Q3_K_L.gguf b/granite-4.1-30b-Q3_K_L.gguf new file mode 100644 index 0000000..7965f12 --- /dev/null +++ b/granite-4.1-30b-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb38ec12c092a13f6511952977c5c750df6f8e2c809b2ce2e8b0814a2ebba300 +size 15129896160 diff --git a/granite-4.1-30b-Q3_K_M.gguf b/granite-4.1-30b-Q3_K_M.gguf new file mode 100644 index 0000000..e10d46c --- /dev/null +++ b/granite-4.1-30b-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc70d78a721ea39c14c42d44539904e6211e8f6a1fd20902ae7160946df7bccd +size 13956539616 diff --git a/granite-4.1-30b-Q3_K_S.gguf b/granite-4.1-30b-Q3_K_S.gguf new file mode 100644 index 0000000..748f69d --- /dev/null +++ b/granite-4.1-30b-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a807f6ea95a69a2e159978299fcbb310c14307cbaaa2a64cbb18b7fc7a087df3 +size 
12569273568 diff --git a/granite-4.1-30b-Q4_0.gguf b/granite-4.1-30b-Q4_0.gguf new file mode 100644 index 0000000..65ecbdf --- /dev/null +++ b/granite-4.1-30b-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03796ec23dc280304a32e7db5e82e13225786e5ae7c2441cef0ada4afa2dc8a6 +size 16348341472 diff --git a/granite-4.1-30b-Q4_1.gguf b/granite-4.1-30b-Q4_1.gguf new file mode 100644 index 0000000..e0eb1ad --- /dev/null +++ b/granite-4.1-30b-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c354f0c53be963ce5fbf6009d360b9ec8707b9daf825387f23f5c945b95d1799 +size 18126726368 diff --git a/granite-4.1-30b-Q4_K_M.gguf b/granite-4.1-30b-Q4_K_M.gguf new file mode 100644 index 0000000..e3fb18b --- /dev/null +++ b/granite-4.1-30b-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33e4376e3581d11236ea53ced6b38399f6e91c0a391488486dc0827972f23f6 +size 17490240736 diff --git a/granite-4.1-30b-Q4_K_S.gguf b/granite-4.1-30b-Q4_K_S.gguf new file mode 100644 index 0000000..af3f2b9 --- /dev/null +++ b/granite-4.1-30b-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c53f0adb8c7479ed73e8445aeb7f23494bd109ae248cb74af0ae482eb6d53b59 +size 16484656352 diff --git a/granite-4.1-30b-Q5_0.gguf b/granite-4.1-30b-Q5_0.gguf new file mode 100644 index 0000000..618148c --- /dev/null +++ b/granite-4.1-30b-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e7b9b8bd24bcff3015fcfb125d910303d8ad3e017aee086fd6d286e7cd8e480 +size 19905111264 diff --git a/granite-4.1-30b-Q5_1.gguf b/granite-4.1-30b-Q5_1.gguf new file mode 100644 index 0000000..1cbf6ba --- /dev/null +++ b/granite-4.1-30b-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6d6df1d5063fbd6021c26955ebd2d42a30b12fcf1e2addac64fd5458400bf6 +size 21683496160 diff --git a/granite-4.1-30b-Q5_K_M.gguf b/granite-4.1-30b-Q5_K_M.gguf new file mode 100644 index 
0000000..9b1f74f --- /dev/null +++ b/granite-4.1-30b-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90011962485021b2836e7476c1697f57e4ba041898e8a81dd4123cbe1b8d2340 +size 20493362400 diff --git a/granite-4.1-30b-Q5_K_S.gguf b/granite-4.1-30b-Q5_K_S.gguf new file mode 100644 index 0000000..fd27041 --- /dev/null +++ b/granite-4.1-30b-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042ed3eb174a7fca1f8304f7501f64495cadcc36cd8fd474079d83f9c2e856eb +size 19905111264 diff --git a/granite-4.1-30b-Q6_K.gguf b/granite-4.1-30b-Q6_K.gguf new file mode 100644 index 0000000..13f2bc5 --- /dev/null +++ b/granite-4.1-30b-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182f89335e9b891b799230f496af5bd1f1dfff97e79bab424776b2d65766b53b +size 23684179168 diff --git a/granite-4.1-30b-Q8_0.gguf b/granite-4.1-30b-Q8_0.gguf new file mode 100644 index 0000000..202811c --- /dev/null +++ b/granite-4.1-30b-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f772a60949ab40144bca249a5a38f7fa530d6b6649c14b8b6395c4cd64ef396 +size 30674969824 diff --git a/granite-4.1-30b-bf16-00001-of-00005.gguf b/granite-4.1-30b-bf16-00001-of-00005.gguf new file mode 100644 index 0000000..b1dc6df --- /dev/null +++ b/granite-4.1-30b-bf16-00001-of-00005.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f18308307d43cfbfd27cc77522781b55b34067291c13a8fc6044bdad78b0e11 +size 13274807328 diff --git a/granite-4.1-30b-bf16-00002-of-00005.gguf b/granite-4.1-30b-bf16-00002-of-00005.gguf new file mode 100644 index 0000000..2a8b71f --- /dev/null +++ b/granite-4.1-30b-bf16-00002-of-00005.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52920fb850451336032283497d708a9c1e070b3da594518d94bc34b862f6ac7 +size 12986031712 diff --git a/granite-4.1-30b-bf16-00003-of-00005.gguf b/granite-4.1-30b-bf16-00003-of-00005.gguf new file mode 100644 index 
0000000..a07668c --- /dev/null +++ b/granite-4.1-30b-bf16-00003-of-00005.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d078bf53a5a8fddd7c0873fdd1584c187444ff539fb45e7e48e6ffe3b59ef7 +size 12717612640 diff --git a/granite-4.1-30b-bf16-00004-of-00005.gguf b/granite-4.1-30b-bf16-00004-of-00005.gguf new file mode 100644 index 0000000..8ca4648 --- /dev/null +++ b/granite-4.1-30b-bf16-00004-of-00005.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38733f6dd2a49a051193316890cfb66fede7a7b202355bab37627563dee7e61 +size 12491103840 diff --git a/granite-4.1-30b-bf16-00005-of-00005.gguf b/granite-4.1-30b-bf16-00005-of-00005.gguf new file mode 100644 index 0000000..68675e0 --- /dev/null +++ b/granite-4.1-30b-bf16-00005-of-00005.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a0ac5b3b9930c03b4cbe80be384b6a207c5bb3b49ae736d662eb6adeb92191 +size 6266540000