commit 3f2cfb298cd0744593ce17880415fc9db2ae47bb Author: ModelHub XC Date: Fri May 8 21:11:55 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4d526e7 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +featherless-quants.png filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..f05c307 --- /dev/null +++ b/README.md @@ -0,0 +1,47 @@ +--- +base_model: xw17/TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3 +pipeline_tag: text-generation +quantized_by: featherless-ai-quants +--- + +# xw17/TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3 GGUF Quantizations 🚀 + +![Featherless AI Quants](./featherless-quants.png) + +*Optimized GGUF quantization files for enhanced model performance* + +> Powered by [Featherless AI](https://featherless.ai) - run any model you'd like for a simple small fee. +--- + +## Available Quantizations 📊 + +| Quantization Type | File | Size | +|-------------------|------|------| +| IQ4_XS | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf) | 581.56 MB | +| Q2_K | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf) | 412.11 MB | +| Q3_K_L | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf) | 564.12 MB | +| Q3_K_M | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf) | 523.00 MB | +| Q3_K_S | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf) | 476.21 MB | +| Q4_K_M | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf) | 636.88 MB | +| Q4_K_S | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf) | 610.23 MB | +| Q5_K_M | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf) | 745.82 MB | +| Q5_K_S | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf) | 730.54 MB | +| Q6_K | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf) | 861.56 MB | +| Q8_0 | [xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf](https://huggingface.co/featherless-ai-quants/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-GGUF/blob/main/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf) | 1115.62 MB | + + +--- + +## ⚡ Powered by [Featherless AI](https://featherless.ai) + +### Key Features + +- 🔥 **Instant Hosting** - Deploy any Llama model on HuggingFace instantly +- 🛠️ **Zero Infrastructure** - No server setup or maintenance required +- 📚 **Vast Compatibility** - Support for 2400+ models and counting +- 💎 **Affordable Pricing** - Starting at just $10/month + +--- + +**Links:** +[Get Started](https://featherless.ai) | [Documentation](https://featherless.ai/docs) | [Models](https://featherless.ai/models) \ No newline at end of file diff --git a/featherless-quants.png b/featherless-quants.png new file mode 100644 index 0000000..3e0eab9 --- /dev/null +++ b/featherless-quants.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1b4d66c8306c7b0614089381fdf86ea4efb02dffb78d22767a084cb8b88d6b +size 1614532 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf new file mode 100644 index 0000000..cdaff9f --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8daaf6cc975b9835bd93b514d97e30e100d09cb854896a851dfa5d25fbeaf6 +size 609807936 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf new file mode 100644 index 0000000..d904eca --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f07bd51b07561dc8bfec7aa7531c7618e51f227f4e07cdfe5883bddf211c1d7 +size 432131648 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf new file mode 100644 index 0000000..8623882 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f36d93be6e23e7c365cc87b064a334f10057d7407e93ea184cb5018dfe444c +size 591527488 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf new file mode 100644 index 0000000..d3406c1 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241e15dbe88693dbcc1532c1accfe82a0d7e2d7dba6df0c34a3b5fb1a85d632f +size 548404800 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf new file mode 100644 index 0000000..f5cb4cb --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc031a5e7a33716baa7a35e7a2932b350f0aeccf4d520be1bb6976f93810e2c7 +size 499342912 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf new file mode 100644 index 0000000..df382e4 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ba7111ed1208804875ce26d22438cac3eb9dd4e0a66b4c0754575c3950be65 +size 667815488 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf new file mode 100644 index 0000000..2744edf --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97dfab126525ab712bd1a81bd60d19758f4aa3bbec7b82b496cb71d3e61ab76e +size 639872576 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf new file mode 100644 index 0000000..d86b564 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4524962d27b093733113e22ec834e1c5833cb63aff7562674e30e6d2d46abd2 +size 782044736 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf new file mode 100644 index 0000000..ee4298c --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae60316e6c2d99d9a87b5a1ab33c51d1f86ecd8de6bc9d0f07f51185405430a +size 766029376 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf new file mode 100644 index 0000000..cafba09 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87acd5ab7046246f02458f1862cce22e004608848b54c8c3787b1933e044d46 +size 903413312 diff --git a/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf new file mode 100644 index 0000000..6a822d4 --- /dev/null +++ b/xw17-TinyLlama-1.1B-Chat-v1.0_finetuned_s01_3-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c42da9027f82b58fb703647f09884cbcbd01e682622efe88ef735e59703fad2f +size 1169808960