From f848f9eba39d2c2e46c5d450297121dbcd9faceb Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 19 Jun 2026 05:58:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: Avtrkrb/granite-claude-h-350m-GGUF Source: Original Platform --- .gitattributes | 41 ++++++++++++++ README.md | 88 +++++++++++++++++++++++++++++++ granite-claude-h-350m-F16.gguf | 3 ++ granite-claude-h-350m-Q4_0.gguf | 3 ++ granite-claude-h-350m-Q4_K_M.gguf | 3 ++ granite-claude-h-350m-Q5_K_M.gguf | 3 ++ granite-claude-h-350m-Q6_K.gguf | 3 ++ granite-claude-h-350m-Q8_0.gguf | 3 ++ 8 files changed, 147 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 granite-claude-h-350m-F16.gguf create mode 100644 granite-claude-h-350m-Q4_0.gguf create mode 100644 granite-claude-h-350m-Q4_K_M.gguf create mode 100644 granite-claude-h-350m-Q5_K_M.gguf create mode 100644 granite-claude-h-350m-Q6_K.gguf create mode 100644 granite-claude-h-350m-Q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..dceac25 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,41 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-F16.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..411bd76 --- /dev/null +++ b/README.md @@ -0,0 +1,88 @@ +--- +license: apache-2.0 +language: + - en +pipeline_tag: text-generation +tags: + - granite + - gguf + - llama-cpp + - reasoning + - quantized + - local-llm + +base_model: Avtrkrb/granite-claude-h-350m + +library_name: gguf +--- + +# granite-claude-h-350m-GGUF + +GGUF quantizations of: + +`Avtrkrb/granite-claude-h-350m` + +These files are intended for inference using: + +- llama.cpp +- LM Studio +- Open WebUI +- Jan +- KoboldCpp +- GPT4All +- Ollama (after conversion/import) + +--- + +## Available Quantizations + +Typical variants included: + +| Quant | Use Case | +|---------|---------| +| Q4_K_M | Best size / quality balance | +| Q5_K_M | Higher quality | +| Q6_K | Near-lossless for most use cases | +| Q8_0 | Highest quality quantized version | + +--- + +## Source Model + +Merged model: + +https://huggingface.co/Avtrkrb/granite-claude-h-350m + +Dataset: + +https://huggingface.co/datasets/Avtrkrb/combined-reasoning-claude + +--- + +## Example llama.cpp Usage + +```bash +./llama-cli \ + -m granite-claude-h-350m-Q4_K_M.gguf \ + -p "Explain quantum tunneling." +``` + +--- + +## Recommended Quant + +For most users: + +**Q4_K_M** + +offers the best balance between: + +- quality +- speed +- memory usage + +--- + +## License + +This repository follows the licensing terms of the original Granite model. \ No newline at end of file diff --git a/granite-claude-h-350m-F16.gguf b/granite-claude-h-350m-F16.gguf new file mode 100644 index 0000000..fd2c938 --- /dev/null +++ b/granite-claude-h-350m-F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9e51ad0dbfea07a979e6bb33d6ab42ed19a362a03a3e12da1ef7ffa7a96b79 +size 839072288 diff --git a/granite-claude-h-350m-Q4_0.gguf b/granite-claude-h-350m-Q4_0.gguf new file mode 100644 index 0000000..d2e8437 --- /dev/null +++ b/granite-claude-h-350m-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0260502a3f5d0c53740592e974c736e82147f1aa6dc6f50f7f77e1ff6b8220 +size 259425600 diff --git a/granite-claude-h-350m-Q4_K_M.gguf b/granite-claude-h-350m-Q4_K_M.gguf new file mode 100644 index 0000000..898b921 --- /dev/null +++ b/granite-claude-h-350m-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f3855ea5bcea3583a66f1369a27d261b58ed0b64850a44a56a2981eb39b3c2 +size 266015040 diff --git a/granite-claude-h-350m-Q5_K_M.gguf b/granite-claude-h-350m-Q5_K_M.gguf new file mode 100644 index 0000000..927a82a --- /dev/null +++ b/granite-claude-h-350m-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7926fd19c8ee4317483946de215c9e6437c9060624842e3deeef7d48274fef8 +size 305318208 diff --git a/granite-claude-h-350m-Q6_K.gguf b/granite-claude-h-350m-Q6_K.gguf new file mode 100644 index 0000000..0e16fff --- /dev/null +++ b/granite-claude-h-350m-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d1596c0047ce3681ae80e1993429261177eb4ddb8e6b4bf3e850498f173370 +size 347077824 diff --git a/granite-claude-h-350m-Q8_0.gguf b/granite-claude-h-350m-Q8_0.gguf new file mode 100644 index 0000000..1c4f0cf --- /dev/null +++ b/granite-claude-h-350m-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b33768b9eb9c0a34b2dcdc02d8afc391cd8d65c6b3cdeca6ba080798d4a4d4a +size 448083264