commit 0e6d12a94505bca6606a45488404c268cc933542 Author: ModelHub XC Date: Mon Apr 13 18:47:03 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: neopolita/h2o-danube-1.8b-sft-gguf Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..a814e0c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q2_k.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q3_k_s.gguf 
filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q3_k_l.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q4_0.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q5_0.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q6_k.gguf filter=lfs diff=lfs merge=lfs -text +h2o-danube-1.8b-sft_q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..1920e41 --- /dev/null +++ b/README.md @@ -0,0 +1,27 @@ +--- +{} +--- +# GGUF quants for [**h2oai/h2o-danube-1.8b-sft**](https://huggingface.co/h2oai/h2o-danube-1.8b-sft) using [llama.cpp](https://github.com/ggerganov/llama.cpp) + +**Terms of Use**: Please check the [**original model**](https://huggingface.co/h2oai/h2o-danube-1.8b-sft) + + +cthulhu + + +## Quants + +* `q2_k`: Uses Q4_K for the attention.wv and feed_forward.w2 tensors, Q2_K for the other tensors. +* `q3_k_s`: Uses Q3_K for all tensors +* `q3_k_m`: Uses Q4_K for the attention.wv, attention.wo, and feed_forward.w2 tensors, else Q3_K +* `q3_k_l`: Uses Q5_K for the attention.wv, attention.wo, and feed_forward.w2 tensors, else Q3_K +* `q4_0`: Original quant method, 4-bit. +* `q4_1`: Higher accuracy than q4_0 but not as high as q5_0. However has quicker inference than q5 models. +* `q4_k_s`: Uses Q4_K for all tensors +* `q4_k_m`: Uses Q6_K for half of the attention.wv and feed_forward.w2 tensors, else Q4_K +* `q5_0`: Higher accuracy, higher resource usage and slower inference. +* `q5_1`: Even higher accuracy, resource usage and slower inference. 
+* `q5_k_s`: Uses Q5_K for all tensors +* `q5_k_m`: Uses Q6_K for half of the attention.wv and feed_forward.w2 tensors, else Q5_K +* `q6_k`: Uses Q8_K for all tensors +* `q8_0`: Almost indistinguishable from float16. High resource use and slow. Not recommended for most users. \ No newline at end of file diff --git a/h2o-danube-1.8b-sft_q2_k.gguf b/h2o-danube-1.8b-sft_q2_k.gguf new file mode 100644 index 0000000..b9f53cb --- /dev/null +++ b/h2o-danube-1.8b-sft_q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574ffda798ea4949688a82f518afdcffb1dc7d7610c220e12c73c10067c759de +size 710702240 diff --git a/h2o-danube-1.8b-sft_q3_k_l.gguf b/h2o-danube-1.8b-sft_q3_k_l.gguf new file mode 100644 index 0000000..d41868a --- /dev/null +++ b/h2o-danube-1.8b-sft_q3_k_l.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fc08f2aa7c01621cecea83cd00a62504b74b7eac0bbcc99d1582e9e1809153d +size 980203680 diff --git a/h2o-danube-1.8b-sft_q3_k_m.gguf b/h2o-danube-1.8b-sft_q3_k_m.gguf new file mode 100644 index 0000000..65f7c75 --- /dev/null +++ b/h2o-danube-1.8b-sft_q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9f139247a0d1c90d41f704d045d788707c4f9db50a19863850a67cc9a39bf0 +size 905164960 diff --git a/h2o-danube-1.8b-sft_q3_k_s.gguf b/h2o-danube-1.8b-sft_q3_k_s.gguf new file mode 100644 index 0000000..f55c261 --- /dev/null +++ b/h2o-danube-1.8b-sft_q3_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7be5c34516c7dc124f80a3d0674b74057e86dbb8ce56ebeca24f4b18880ea6c +size 820029600 diff --git a/h2o-danube-1.8b-sft_q4_0.gguf b/h2o-danube-1.8b-sft_q4_0.gguf new file mode 100644 index 0000000..306c994 --- /dev/null +++ b/h2o-danube-1.8b-sft_q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8cf4912b81d356ba220f09b9b3745a546840c3383ca8721cc4499e729cc6bc +size 1052339360 diff --git a/h2o-danube-1.8b-sft_q4_k_m.gguf 
b/h2o-danube-1.8b-sft_q4_k_m.gguf new file mode 100644 index 0000000..b53d228 --- /dev/null +++ b/h2o-danube-1.8b-sft_q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:883c11e185215bd7bbdefc83ae066724a5f651dcaa5dcdb832b73d97a3ae1d7e +size 1112151200 diff --git a/h2o-danube-1.8b-sft_q4_k_s.gguf b/h2o-danube-1.8b-sft_q4_k_s.gguf new file mode 100644 index 0000000..d064bc8 --- /dev/null +++ b/h2o-danube-1.8b-sft_q4_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8d9474f01c8bb856d9cc8d3a4713e19245929c248f832869d37a9c0850ad1a +size 1059794080 diff --git a/h2o-danube-1.8b-sft_q5_0.gguf b/h2o-danube-1.8b-sft_q5_0.gguf new file mode 100644 index 0000000..9e35f8a --- /dev/null +++ b/h2o-danube-1.8b-sft_q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ba36a042bea644076b1c866f7234d12a5fbc7dadab05a1499cb8a1d17bcfeaa +size 1270983840 diff --git a/h2o-danube-1.8b-sft_q5_k_m.gguf b/h2o-danube-1.8b-sft_q5_k_m.gguf new file mode 100644 index 0000000..3418a31 --- /dev/null +++ b/h2o-danube-1.8b-sft_q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a744aca5cb08bac1706461db40c5e817ac8eca168ecc8f84777e39f2446a31c +size 1301796000 diff --git a/h2o-danube-1.8b-sft_q5_k_s.gguf b/h2o-danube-1.8b-sft_q5_k_s.gguf new file mode 100644 index 0000000..ba3179a --- /dev/null +++ b/h2o-danube-1.8b-sft_q5_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb73d40260890c3d14fbc0a51ff0dbedcc6649246a2280138b064457daa25ecd +size 1270983840 diff --git a/h2o-danube-1.8b-sft_q6_k.gguf b/h2o-danube-1.8b-sft_q6_k.gguf new file mode 100644 index 0000000..739028c --- /dev/null +++ b/h2o-danube-1.8b-sft_q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:029c17f00d32c4d88a2cce945c8687c8dc5c07cca113d81ea8b0dbcb22f98789 +size 1503293600 diff --git a/h2o-danube-1.8b-sft_q8_0.gguf b/h2o-danube-1.8b-sft_q8_0.gguf new 
file mode 100644 index 0000000..6ff750f --- /dev/null +++ b/h2o-danube-1.8b-sft_q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b8f67c3bdb7bc8672d39eaf78d5d50219b37c6d2317863ec645eeaffd25682 +size 1946757280