commit f848f9eba39d2c2e46c5d450297121dbcd9faceb Author: ModelHub XC Date: Fri Jun 19 05:58:16 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: Avtrkrb/granite-claude-h-350m-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..dceac25 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,41 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-F16.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q4_0.gguf 
filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +granite-claude-h-350m-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..411bd76 --- /dev/null +++ b/README.md @@ -0,0 +1,88 @@ +--- +license: apache-2.0 +language: + - en +pipeline_tag: text-generation +tags: + - granite + - gguf + - llama-cpp + - reasoning + - quantized + - local-llm + +base_model: Avtrkrb/granite-claude-h-350m + +library_name: gguf +--- + +# granite-claude-h-350m-GGUF + +GGUF quantizations of: + +`Avtrkrb/granite-claude-h-350m` + +These files are intended for inference using: + +- llama.cpp +- LM Studio +- Open WebUI +- Jan +- KoboldCpp +- GPT4All +- Ollama (after importing the GGUF file via a Modelfile) + +--- + +## Available Quantizations + +Recommended quantized variants (this repository also provides F16 and Q4_0 files): + +| Quant | Use Case | +|---------|---------| +| Q4_K_M | Best size / quality balance | +| Q5_K_M | Higher quality | +| Q6_K | Near-lossless for most use cases | +| Q8_0 | Highest quality quantized version | + +--- + +## Source Model + +Merged model: + +https://huggingface.co/Avtrkrb/granite-claude-h-350m + +Dataset: + +https://huggingface.co/datasets/Avtrkrb/combined-reasoning-claude + +--- + +## Example llama.cpp Usage + +```bash +./llama-cli \ + -m granite-claude-h-350m-Q4_K_M.gguf \ + -p "Explain quantum tunneling." +``` + +--- + +## Recommended Quant + +For most users: + +**Q4_K_M** + +offers the best balance between: + +- quality +- speed +- memory usage + +--- + +## License + +This repository follows the licensing terms of the original Granite model (Apache 2.0, as declared in the metadata above). 
\ No newline at end of file diff --git a/granite-claude-h-350m-F16.gguf b/granite-claude-h-350m-F16.gguf new file mode 100644 index 0000000..fd2c938 --- /dev/null +++ b/granite-claude-h-350m-F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9e51ad0dbfea07a979e6bb33d6ab42ed19a362a03a3e12da1ef7ffa7a96b79 +size 839072288 diff --git a/granite-claude-h-350m-Q4_0.gguf b/granite-claude-h-350m-Q4_0.gguf new file mode 100644 index 0000000..d2e8437 --- /dev/null +++ b/granite-claude-h-350m-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0260502a3f5d0c53740592e974c736e82147f1aa6dc6f50f7f77e1ff6b8220 +size 259425600 diff --git a/granite-claude-h-350m-Q4_K_M.gguf b/granite-claude-h-350m-Q4_K_M.gguf new file mode 100644 index 0000000..898b921 --- /dev/null +++ b/granite-claude-h-350m-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f3855ea5bcea3583a66f1369a27d261b58ed0b64850a44a56a2981eb39b3c2 +size 266015040 diff --git a/granite-claude-h-350m-Q5_K_M.gguf b/granite-claude-h-350m-Q5_K_M.gguf new file mode 100644 index 0000000..927a82a --- /dev/null +++ b/granite-claude-h-350m-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7926fd19c8ee4317483946de215c9e6437c9060624842e3deeef7d48274fef8 +size 305318208 diff --git a/granite-claude-h-350m-Q6_K.gguf b/granite-claude-h-350m-Q6_K.gguf new file mode 100644 index 0000000..0e16fff --- /dev/null +++ b/granite-claude-h-350m-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d1596c0047ce3681ae80e1993429261177eb4ddb8e6b4bf3e850498f173370 +size 347077824 diff --git a/granite-claude-h-350m-Q8_0.gguf b/granite-claude-h-350m-Q8_0.gguf new file mode 100644 index 0000000..1c4f0cf --- /dev/null +++ b/granite-claude-h-350m-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b33768b9eb9c0a34b2dcdc02d8afc391cd8d65c6b3cdeca6ba080798d4a4d4a +size 
448083264