From d298c1800726be0adcf5d1aa597811de54853d1c Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 22 Jun 2026 04:21:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++ Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf | 3 ++ Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf | 3 ++ README.md | 47 +++++++++++++++++++ configuration.json | 1 + featherless-quants.png | 3 ++ 15 files changed, 144 insertions(+) create mode 100644 .gitattributes create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf create mode 100644 Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf create mode 100644 README.md create mode 100644 configuration.json create mode 100644 featherless-quants.png diff --git a/.gitattributes 
b/.gitattributes new file mode 100644 index 0000000..ec466a4 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text + +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs 
merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +featherless-quants.png filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf new file mode 100644 index 0000000..47934d4 --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94bb227e53bfb1fd0b135d1febf51161c655211a6ac8139ff3f65add815e3801 +size 4250298720 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf new file mode 100644 index 0000000..55f9825 --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b43e86080bbb2aeecd7b05a281420f66d6c022131280bab3b9665ddd69c8daca +size 3015940448 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf new file mode 100644 index 0000000..d6f5697 --- /dev/null +++ 
b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d010bdc57be9a6be5dfa58e7415660a340fa3929425ddc9b405c80ebb77031 +size 4088459616 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf new file mode 100644 index 0000000..909dd30 --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b082235cbf88929e4369557d42f1540d6bfcce1b83770ec6b5f04131a3760788 +size 3808391520 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf new file mode 100644 index 0000000..9647a02 --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f926d919cf02f522b3417150294790b703642432329189124dd85c963ddb4d8 +size 3492368736 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf new file mode 100644 index 0000000..d9ac69b --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2c1c1124eec603c1f2745598a7f2d293a975f6350bda9985777aacd7c4d899 +size 4683073888 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf new file mode 100644 index 0000000..3eaf85e --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4635d23bd22fd829b089d48a522aa004d90128f7e4b2a6d1e6837f3962eb2a +size 4457769312 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf new file mode 100644 index 0000000..f1a497e --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038ce331ba4ff9eeb072c2523e0897560094e94d08b626c0c66fd4b635f035ca +size 5444831584 diff --git 
a/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf new file mode 100644 index 0000000..9e3d65d --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8898ee49e7ed717c37ab6220c49316c5e068b9438082d8c1c8f92422057c3148 +size 5315176800 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf new file mode 100644 index 0000000..9e69b1a --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ce0c1682f74092c5157bdbe5cdb1ac0cb4a8708a726af71e0e14a96df3838d +size 6254199136 diff --git a/Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf b/Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf new file mode 100644 index 0000000..8c2efab --- /dev/null +++ b/Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d49a7051f078abd0088b7b3af092179b5c7218e507798d74c10dad074ebae602 +size 8098525536 diff --git a/README.md b/README.md new file mode 100644 index 0000000..7bc2c95 --- /dev/null +++ b/README.md @@ -0,0 +1,47 @@ +--- +base_model: Qwen/Qwen2.5-7B-Instruct-1M +pipeline_tag: text-generation +quantized_by: featherless-ai-quants +--- + +# Qwen/Qwen2.5-7B-Instruct-1M GGUF Quantizations 🚀 + +![Featherless AI Quants](./featherless-quants.png) + +*Optimized GGUF quantization files for enhanced model performance* + +> Powered by [Featherless AI](https://featherless.ai) - run any model you'd like for a simple small fee. 
+--- + +## Available Quantizations 📊 + +| Quantization Type | File | Size | +|-------------------|------|------| +| IQ4_XS | [Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-IQ4_XS.gguf) | 4053.40 MiB | +| Q2_K | [Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q2_K.gguf) | 2876.22 MiB | +| Q3_K_L | [Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_L.gguf) | 3899.06 MiB | +| Q3_K_M | [Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_M.gguf) | 3631.97 MiB | +| Q3_K_S | [Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q3_K_S.gguf) | 3330.58 MiB | +| Q4_K_M | [Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_M.gguf) | 4466.13 MiB | +| Q4_K_S | [Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q4_K_S.gguf) | 4251.26 MiB | +| Q5_K_M | [Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_M.gguf) | 5192.60 MiB | +| Q5_K_S | [Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q5_K_S.gguf) | 5068.95 MiB | +| Q6_K | 
[Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q6_K.gguf) | 5964.47 MiB | +| Q8_0 | [Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf](https://huggingface.co/featherless-ai-quants/Qwen-Qwen2.5-7B-Instruct-1M-GGUF/blob/main/Qwen-Qwen2.5-7B-Instruct-1M-Q8_0.gguf) | 7723.36 MiB | + + +--- + +## ⚡ Powered by [Featherless AI](https://featherless.ai) + +### Key Features + +- 🔥 **Instant Hosting** - Deploy any Llama model on HuggingFace instantly +- 🛠️ **Zero Infrastructure** - No server setup or maintenance required +- 📚 **Vast Compatibility** - Support for 2400+ models and counting +- 💎 **Affordable Pricing** - Starting at just $10/month + +--- + +**Links:** +[Get Started](https://featherless.ai) | [Documentation](https://featherless.ai/docs) | [Models](https://featherless.ai/models) \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/featherless-quants.png b/featherless-quants.png new file mode 100644 index 0000000..3e0eab9 --- /dev/null +++ b/featherless-quants.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1b4d66c8306c7b0614089381fdf86ea4efb02dffb78d22767a084cb8b88d6b +size 1614532