From b62ef371ae9e55f638c4c061be59ff4636ebf9dc Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 18 Apr 2026 20:00:37 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: matrixportalx/layerskip-llama3.2-1B-GGUF Source: Original Platform --- .gitattributes | 48 +++++++++++++++++++++++++++++++ README.md | 43 +++++++++++++++++++++++++++ layerskip-llama3.2-1b.f16.gguf | 3 ++ layerskip-llama3.2-1b.q2_k.gguf | 3 ++ layerskip-llama3.2-1b.q3_k_l.gguf | 3 ++ layerskip-llama3.2-1b.q3_k_m.gguf | 3 ++ layerskip-llama3.2-1b.q3_k_s.gguf | 3 ++ layerskip-llama3.2-1b.q4_0.gguf | 3 ++ layerskip-llama3.2-1b.q4_k_m.gguf | 3 ++ layerskip-llama3.2-1b.q4_k_s.gguf | 3 ++ layerskip-llama3.2-1b.q5_0.gguf | 3 ++ layerskip-llama3.2-1b.q5_k_m.gguf | 3 ++ layerskip-llama3.2-1b.q5_k_s.gguf | 3 ++ layerskip-llama3.2-1b.q6_k.gguf | 3 ++ layerskip-llama3.2-1b.q8_0.gguf | 3 ++ 15 files changed, 130 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 layerskip-llama3.2-1b.f16.gguf create mode 100644 layerskip-llama3.2-1b.q2_k.gguf create mode 100644 layerskip-llama3.2-1b.q3_k_l.gguf create mode 100644 layerskip-llama3.2-1b.q3_k_m.gguf create mode 100644 layerskip-llama3.2-1b.q3_k_s.gguf create mode 100644 layerskip-llama3.2-1b.q4_0.gguf create mode 100644 layerskip-llama3.2-1b.q4_k_m.gguf create mode 100644 layerskip-llama3.2-1b.q4_k_s.gguf create mode 100644 layerskip-llama3.2-1b.q5_0.gguf create mode 100644 layerskip-llama3.2-1b.q5_k_m.gguf create mode 100644 layerskip-llama3.2-1b.q5_k_s.gguf create mode 100644 layerskip-llama3.2-1b.q6_k.gguf create mode 100644 layerskip-llama3.2-1b.q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b576653 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,48 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q2_k.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q3_k_s.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q3_k_l.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q4_0.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q5_0.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q6_k.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.q8_0.gguf filter=lfs diff=lfs merge=lfs -text +layerskip-llama3.2-1b.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..4bd12eb --- /dev/null +++ b/README.md @@ -0,0 +1,43 @@ +--- +license: llama3.2 +datasets: + - teknium/OpenHermes-2.5 + - NousResearch/hermes-function-calling-v1 +base_model: + - minpeter/QLoRA-Llama-3.2-1B-chatml-tool-v4 + - meta-llama/Llama-3.2-1B +language: + - en +pipeline_tag: text-generation +library_name: transformers +tags: + - axolotl + - merge +--- + +# layerskip-llama3.2-1B GGUF Quantized Models + +## Technical Details +- **Quantization Tool:** llama.cpp +- **Version:** version: 5092 (d3bd7193) + +## Model Information +- **Base Model:** [facebook/layerskip-llama3.2-1B](https://huggingface.co/facebook/layerskip-llama3.2-1B) +- **Quantized by:** [matrixportal](https://huggingface.co/matrixportal) + +## Available Files +- [`layerskip-llama3.2-1b.q2_k.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q2_k.gguf) (553.96MB) +- [`layerskip-llama3.2-1b.q3_k_s.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q3_k_s.gguf) (611.96MB) +- [`layerskip-llama3.2-1b.q3_k_m.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q3_k_m.gguf) (658.84MB) +- [`layerskip-llama3.2-1b.q3_k_l.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q3_k_l.gguf) (698.59MB) +- [`layerskip-llama3.2-1b.q4_0.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q4_0.gguf) (735.21MB) +- [`layerskip-llama3.2-1b.q4_k_s.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q4_k_s.gguf) (739.71MB) +- [`layerskip-llama3.2-1b.q4_k_m.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q4_k_m.gguf) (770.27MB) +- [`layerskip-llama3.2-1b.q5_0.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q5_0.gguf) (851.21MB) +- [`layerskip-llama3.2-1b.q5_k_s.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q5_k_s.gguf) (851.21MB) +- [`layerskip-llama3.2-1b.q5_k_m.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q5_k_m.gguf) (869.27MB) +- [`layerskip-llama3.2-1b.q6_k.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q6_k.gguf) (974.46MB) +- [`layerskip-llama3.2-1b.q8_0.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.q8_0.gguf) (1259.88MB) +- [`layerskip-llama3.2-1b.f16.gguf`](https://huggingface.co/matrixportal/layerskip-llama3.2-1B-GGUF/resolve/main/layerskip-llama3.2-1b.f16.gguf) (2364.72MB) + +💡 Q4_K_M provides the best balance for most use cases \ No newline at end of file diff --git a/layerskip-llama3.2-1b.f16.gguf b/layerskip-llama3.2-1b.f16.gguf new file mode 100644 index 0000000..81f93fc --- /dev/null +++ b/layerskip-llama3.2-1b.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fa0962563428d213a25f68ea32f5b48646200f076331ddc83c70018ccd335d +size 2479591712 diff --git a/layerskip-llama3.2-1b.q2_k.gguf b/layerskip-llama3.2-1b.q2_k.gguf new file mode 100644 index 0000000..202df5a --- /dev/null +++ b/layerskip-llama3.2-1b.q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f03f9b134a408ffe6cd6265bb830697b91e8288f24ee26e80e88ae693024b1b +size 580870432 diff --git a/layerskip-llama3.2-1b.q3_k_l.gguf b/layerskip-llama3.2-1b.q3_k_l.gguf new file mode 100644 index 0000000..775ce0b --- /dev/null +++ b/layerskip-llama3.2-1b.q3_k_l.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6efb8bd6a6fac265e6c7b13db9fe96c301fbd91a309dda9841d2707f4c1e2ba +size 732520736 diff --git a/layerskip-llama3.2-1b.q3_k_m.gguf b/layerskip-llama3.2-1b.q3_k_m.gguf new file mode 100644 index 0000000..b694d94 --- /dev/null +++ b/layerskip-llama3.2-1b.q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0473d48f48ab7ce68db540c9c44a6967e9be39472a3db95208e4a4f5f4bd80fc +size 690839840 diff --git a/layerskip-llama3.2-1b.q3_k_s.gguf b/layerskip-llama3.2-1b.q3_k_s.gguf new file mode 100644 index 0000000..6daeca3 --- /dev/null +++ b/layerskip-llama3.2-1b.q3_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68862ba2d8614d76bd9768fe505ec2122e11127ab978c48e4369bfa01f02ce1f +size 641687840 diff --git a/layerskip-llama3.2-1b.q4_0.gguf b/layerskip-llama3.2-1b.q4_0.gguf new file mode 100644 index 0000000..9fe9609 --- /dev/null +++ b/layerskip-llama3.2-1b.q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed933b909620413d4f3bf7f5239a108f50c58e9cc5dddf45a30a93ce3b68d425 +size 770924832 diff --git a/layerskip-llama3.2-1b.q4_k_m.gguf b/layerskip-llama3.2-1b.q4_k_m.gguf new file mode 100644 index 0000000..b6b183f --- /dev/null +++ b/layerskip-llama3.2-1b.q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc64bc0994871314dd1c4d7e673e293e912f5737e5c91055eeb9ec56cda3f500 +size 807690528 diff --git a/layerskip-llama3.2-1b.q4_k_s.gguf b/layerskip-llama3.2-1b.q4_k_s.gguf new file mode 100644 index 0000000..10e33a3 --- /dev/null +++ b/layerskip-llama3.2-1b.q4_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd85e335d74ae514e8a3c8c31626bf6a76b3571a55c998d582fe31efd0b831f +size 775643424 diff --git a/layerskip-llama3.2-1b.q5_0.gguf b/layerskip-llama3.2-1b.q5_0.gguf new file mode 100644 index 0000000..4739c61 --- /dev/null +++ b/layerskip-llama3.2-1b.q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a038ca8f19c1adca04bc66ed39cf2f9df04afaa6b88f492b900d341e85dfba +size 892559648 diff --git a/layerskip-llama3.2-1b.q5_k_m.gguf b/layerskip-llama3.2-1b.q5_k_m.gguf new file mode 100644 index 0000000..bafbee7 --- /dev/null +++ b/layerskip-llama3.2-1b.q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c1deb2ced4de01ef1b958d15a8ee5f3cd9b7f4b2041f72e0e09da3d7d42ca6 +size 911499552 diff --git a/layerskip-llama3.2-1b.q5_k_s.gguf b/layerskip-llama3.2-1b.q5_k_s.gguf new file mode 100644 index 0000000..f81769b --- /dev/null +++ b/layerskip-llama3.2-1b.q5_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb5da05514ba9423cbe5c0abda9e4606696c46b29457df8904ee4508b172fce +size 892559648 diff --git a/layerskip-llama3.2-1b.q6_k.gguf b/layerskip-llama3.2-1b.q6_k.gguf new file mode 100644 index 0000000..2e981a1 --- /dev/null +++ b/layerskip-llama3.2-1b.q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7b3e96da65703fede9dac7fdda3077e0b2c935203ff088409bc6ece01f7507 +size 1021796640 diff --git a/layerskip-llama3.2-1b.q8_0.gguf b/layerskip-llama3.2-1b.q8_0.gguf new file mode 100644 index 0000000..4f9c643 --- /dev/null +++ b/layerskip-llama3.2-1b.q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1e236750394bf6acf81ad2cbd68e1b4600055b06527e4fe2c4160383cb061e +size 1321079072