From 709061b1dfa0e090ca48628406c74eae67d60ad4 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 12 Jun 2026 04:14:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: ibm-granite/granite-guardian-4.1-8b-GGUF Source: Original Platform --- .gitattributes | 50 +++++++++++++++++++++++++++++ README.md | 44 +++++++++++++++++++++++++ granite-guardian-4.1-8b-Q2_K.gguf | 3 ++ granite-guardian-4.1-8b-Q3_K_L.gguf | 3 ++ granite-guardian-4.1-8b-Q3_K_M.gguf | 3 ++ granite-guardian-4.1-8b-Q3_K_S.gguf | 3 ++ granite-guardian-4.1-8b-Q4_0.gguf | 3 ++ granite-guardian-4.1-8b-Q4_1.gguf | 3 ++ granite-guardian-4.1-8b-Q4_K_M.gguf | 3 ++ granite-guardian-4.1-8b-Q4_K_S.gguf | 3 ++ granite-guardian-4.1-8b-Q5_0.gguf | 3 ++ granite-guardian-4.1-8b-Q5_1.gguf | 3 ++ granite-guardian-4.1-8b-Q5_K_M.gguf | 3 ++ granite-guardian-4.1-8b-Q5_K_S.gguf | 3 ++ granite-guardian-4.1-8b-Q6_K.gguf | 3 ++ granite-guardian-4.1-8b-Q8_0.gguf | 3 ++ granite-guardian-4.1-8b-bf16.gguf | 3 ++ 17 files changed, 139 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 granite-guardian-4.1-8b-Q2_K.gguf create mode 100644 granite-guardian-4.1-8b-Q3_K_L.gguf create mode 100644 granite-guardian-4.1-8b-Q3_K_M.gguf create mode 100644 granite-guardian-4.1-8b-Q3_K_S.gguf create mode 100644 granite-guardian-4.1-8b-Q4_0.gguf create mode 100644 granite-guardian-4.1-8b-Q4_1.gguf create mode 100644 granite-guardian-4.1-8b-Q4_K_M.gguf create mode 100644 granite-guardian-4.1-8b-Q4_K_S.gguf create mode 100644 granite-guardian-4.1-8b-Q5_0.gguf create mode 100644 granite-guardian-4.1-8b-Q5_1.gguf create mode 100644 granite-guardian-4.1-8b-Q5_K_M.gguf create mode 100644 granite-guardian-4.1-8b-Q5_K_S.gguf create mode 100644 
granite-guardian-4.1-8b-Q6_K.gguf create mode 100644 granite-guardian-4.1-8b-Q8_0.gguf create mode 100644 granite-guardian-4.1-8b-bf16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b689389 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,50 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-bf16.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text 
+granite-guardian-4.1-8b-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +granite-guardian-4.1-8b-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..2b88b1b --- /dev/null +++ b/README.md @@ -0,0 +1,44 @@ +--- +license: apache-2.0 +language: +- en +pipeline_tag: text-generation +library_name: transformers +base_model: ibm-granite/granite-guardian-4.1-8b +tags: +- granite +- guardian +- safety +- hallucination +- thinking +- tool-calling +- agent +- chat +--- + +> [!NOTE] +> This repository contains models that have been converted to the GGUF format with various quantizations from an IBM Granite base model. +> +> Please reference the base model's full model card here: +> https://huggingface.co/ibm-granite/granite-guardian-4.1-8b + +# Granite Guardian 4.1 8B (GGUF) + +## Model Summary + +**Granite Guardian 4.1 8B** is a specialized safety model fine-tuned from [ibm-granite/granite-4.1-8b](https://huggingface.co/ibm-granite/granite-4.1-8b), designed to judge if the input prompts and the output responses of an LLM-based system meet specified criteria. 
The model comes pre-baked with certain criteria including but not limited to: jailbreak attempts, profanity, and hallucinations related to tool calls and retrieval-augmented generation in agent-based systems. Additionally, the model allows users to bring their own criteria and tailor the judging behavior to specific use cases. + +This version of Granite Guardian is a hybrid thinking model that allows the user to operate in thinking or non-thinking mode. +In thinking mode, the model produces detailed reasoning traces through `<think> ... </think>` and `<score> ... </score>` tags. +In non-thinking mode, the model only produces the judgement score through the `<score> ... </score>` tags. + +It is trained on unique data comprising human annotations and synthetic data informed by internal red-teaming. +It outperforms other open-source models in the same space on standard benchmarks. + +- **Developers:** IBM Research +- **GitHub Repository:** [ibm-granite/granite-guardian](https://github.com/ibm-granite/granite-guardian) +- **Cookbook:** [Granite Guardian Recipes](https://github.com/ibm-granite/granite-guardian/tree/main/cookbooks/granite-guardian-4.1) +- **Website:** [Granite Guardian Docs](https://www.ibm.com/granite/docs/models/guardian/) +- **Paper:** [Granite Guardian](https://arxiv.org/abs/2412.07724) +- **Release Date:** April 2026 +- **License:** [Apache 2.0](https://www.apache.org/licenses/LICENSE-2.0) diff --git a/granite-guardian-4.1-8b-Q2_K.gguf b/granite-guardian-4.1-8b-Q2_K.gguf new file mode 100644 index 0000000..9a90e50 --- /dev/null +++ b/granite-guardian-4.1-8b-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721421b50482b3f844d6e19ed86d21125476a84a8e379c7ea8d07d84ee58a1e8 +size 3277435968 diff --git a/granite-guardian-4.1-8b-Q3_K_L.gguf b/granite-guardian-4.1-8b-Q3_K_L.gguf new file mode 100644 index 0000000..dbc8d3e --- /dev/null +++ b/granite-guardian-4.1-8b-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3d14b784fc42261d2f738734f708ce95625488be28da6697fd92047c57118484 +size 4523275328 diff --git a/granite-guardian-4.1-8b-Q3_K_M.gguf b/granite-guardian-4.1-8b-Q3_K_M.gguf new file mode 100644 index 0000000..da42aeb --- /dev/null +++ b/granite-guardian-4.1-8b-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa82b7d7c2ffba7d0f7f843bec6eca18756bb07c7019254a9925aa2c17ad5b1 +size 4170429504 diff --git a/granite-guardian-4.1-8b-Q3_K_S.gguf b/granite-guardian-4.1-8b-Q3_K_S.gguf new file mode 100644 index 0000000..df82cba --- /dev/null +++ b/granite-guardian-4.1-8b-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7321ca716bc59edc8b8224a159c81928861fee72a825b290aafdc47192eb78 +size 3766334528 diff --git a/granite-guardian-4.1-8b-Q4_0.gguf b/granite-guardian-4.1-8b-Q4_0.gguf new file mode 100644 index 0000000..0031d6e --- /dev/null +++ b/granite-guardian-4.1-8b-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb58ed2189197e047a6fd2d21fcadbd9c012762653b75a3b8a6c5b7f3096798 +size 4824740928 diff --git a/granite-guardian-4.1-8b-Q4_1.gguf b/granite-guardian-4.1-8b-Q4_1.gguf new file mode 100644 index 0000000..43acf51 --- /dev/null +++ b/granite-guardian-4.1-8b-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76481f2ef204235a212631d8d19c4b3c25d8ecbadbc75e928f15f5b9f9569fc +size 5322814528 diff --git a/granite-guardian-4.1-8b-Q4_K_M.gguf b/granite-guardian-4.1-8b-Q4_K_M.gguf new file mode 100644 index 0000000..a3ca418 --- /dev/null +++ b/granite-guardian-4.1-8b-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979114c9e6a589a1e37c2d597677555d3eb78c2856e920ed4ec97f7bded787a4 +size 5116703808 diff --git a/granite-guardian-4.1-8b-Q4_K_S.gguf b/granite-guardian-4.1-8b-Q4_K_S.gguf new file mode 100644 index 0000000..6439369 --- /dev/null +++ b/granite-guardian-4.1-8b-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:f713dd826ef87bb9243b03f649051eacb31c39a6f4b4f7f4b4d3e491c3bcbadf +size 4859606080 diff --git a/granite-guardian-4.1-8b-Q5_0.gguf b/granite-guardian-4.1-8b-Q5_0.gguf new file mode 100644 index 0000000..248ddb3 --- /dev/null +++ b/granite-guardian-4.1-8b-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efc9695e6e2671d89ab425b31af27fec6f53ad5e445d7eebecb254398c835a98 +size 5820888128 diff --git a/granite-guardian-4.1-8b-Q5_1.gguf b/granite-guardian-4.1-8b-Q5_1.gguf new file mode 100644 index 0000000..d52d92c --- /dev/null +++ b/granite-guardian-4.1-8b-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0290ebe906fe0090edf2daab7763c8e5cffec3f9605a6643830278c6d86853f4 +size 6318961728 diff --git a/granite-guardian-4.1-8b-Q5_K_M.gguf b/granite-guardian-4.1-8b-Q5_K_M.gguf new file mode 100644 index 0000000..123c043 --- /dev/null +++ b/granite-guardian-4.1-8b-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb6aa91e991822559583f77d40c860027f856a7f79fe1c6c3c3c35b97c838a5 +size 5971293248 diff --git a/granite-guardian-4.1-8b-Q5_K_S.gguf b/granite-guardian-4.1-8b-Q5_K_S.gguf new file mode 100644 index 0000000..c759d84 --- /dev/null +++ b/granite-guardian-4.1-8b-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c647bad1dba0249f5e031b1f6355228b5d312498e8c603c8499f398db82b4eaa +size 5820888128 diff --git a/granite-guardian-4.1-8b-Q6_K.gguf b/granite-guardian-4.1-8b-Q6_K.gguf new file mode 100644 index 0000000..e690101 --- /dev/null +++ b/granite-guardian-4.1-8b-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0061355a4ef83a8f2bd1c39012b6c013c7679ab658b3845a64f39b5c52ada488 +size 6879294528 diff --git a/granite-guardian-4.1-8b-Q8_0.gguf b/granite-guardian-4.1-8b-Q8_0.gguf new file mode 100644 index 0000000..ba1414c --- /dev/null +++ b/granite-guardian-4.1-8b-Q8_0.gguf @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d078a5f8a1e678a9acd75cafdfa67d90fbf6d3c194c308c57808c8d4e2ac23 +size 8908878912 diff --git a/granite-guardian-4.1-8b-bf16.gguf b/granite-guardian-4.1-8b-bf16.gguf new file mode 100644 index 0000000..09837a5 --- /dev/null +++ b/granite-guardian-4.1-8b-bf16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2547a19610fd5c0678c10992f10ef465508ac457e8fb26537267e168f84e564b +size 16765334592