commit 31290985e8ef83fdaf435f7e45a4f7940f3e81ed Author: ModelHub XC Date: Tue May 26 22:12:21 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..dc4e094 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ1_M.gguf 
filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen3-1.7B-ShiningValiant3.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ1_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ1_M.gguf new file mode 100644 index 0000000..6ec6509 --- /dev/null 
+++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1cfa60afe476dcc1e97a88eeeb844b76e18d8c20e3d03db47f3a9ac4c35727 +size 543795776 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ1_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ1_S.gguf new file mode 100644 index 0000000..29bfd0e --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac5f4b32b3e88454e4851b6c61ef2b693501888cca8e2c71c02a2267d8be382 +size 515779136 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ2_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_M.gguf new file mode 100644 index 0000000..49cea6e --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec65b3a5649e03e0409d9c875e94bd82ebcd0f8a9dc2a9e99ba8e22196eb139e +size 695183936 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ2_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_S.gguf new file mode 100644 index 0000000..e492c21 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f764b49258ed46219f4c33a29e9f9967670cdf2b0591218ead8b87f30e2272c0 +size 657828416 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XS.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XS.gguf new file mode 100644 index 0000000..e103b20 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:366857f892a013fc8fa22b1c1709713a988ae16f244a2d42d9bd5afa00922469 +size 631515712 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XXS.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..3f1e810 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ab29cf4d18089556e57b59131b094ce5371d0cfc7b0541a0b3ecd16fc30494 +size 590490176 diff --git 
a/Qwen3-1.7B-ShiningValiant3.i1-IQ3_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_M.gguf new file mode 100644 index 0000000..c2ba5ca --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0439567b3f2f6177fadc8812cbb8a2d2f89a4bf780c5aa9984d1b3892aaa4b84 +size 895664704 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ3_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_S.gguf new file mode 100644 index 0000000..ee661e6 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca003832880a56c43ad6fbb48232fde8043bc78254616336f309a2704ccf189 +size 867254848 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XS.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XS.gguf new file mode 100644 index 0000000..b1f0e0a --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ab3ac72556270416a69cb91986b706e6e8c6f8681f7f16c53159a167bc8520 +size 834224704 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XXS.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..2d2ece3 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381c6b23a4a110fca112073be2f3422ac6c6e47149c884a1f22cdcecbf7c95cf +size 754362944 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ4_NL.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ4_NL.gguf new file mode 100644 index 0000000..0bf5081 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e724962a2f3288097516184029e12d7864b4d20b2ab66cef49765a81060f9fe +size 1054425664 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-IQ4_XS.gguf b/Qwen3-1.7B-ShiningValiant3.i1-IQ4_XS.gguf new file mode 100644 index 0000000..10ea609 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:9a8e1e30ed4510f1ce13b468ebc643437031371146d0ed8626e6ba825281f1b9 +size 1010385472 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q2_K.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q2_K.gguf new file mode 100644 index 0000000..7eba82d --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd7c04e6ff6019c6f1f6b2adf0d39b05d9f2b9c3e13f2047e826adbacde0273 +size 777798208 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q2_K_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q2_K_S.gguf new file mode 100644 index 0000000..5d4e8ef --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85812b5eebeff7c67f35819017c34a958bff23ee520c76db65971e8f272d9d14 +size 732971584 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_L.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_L.gguf new file mode 100644 index 0000000..049f5c3 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90776b207d3a2bc03e23a13f9f71173a3f7b1cd88e7dd6a5ada6ca2232b49201 +size 1003504192 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a499a51 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:debd0ddea83fa9d979a9e9a3d6f468c2ce068c90c0fb9c16506c3f44fd1b4653 +size 939541056 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_S.gguf new file mode 100644 index 0000000..a0e92ba --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ad948c24128c1a3db991224f9b0bcddf270072c7203aa93856389b5e367a9d +size 867254848 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q4_0.gguf 
b/Qwen3-1.7B-ShiningValiant3.i1-Q4_0.gguf new file mode 100644 index 0000000..029e3b6 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97a825fe745d2ebabc9da54116d7dfbdfb87ce26a4b1f5cde42776c70636347 +size 1056784960 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q4_1.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q4_1.gguf new file mode 100644 index 0000000..e59cd85 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511516b375eaf7a7cb46271de97ba676e2a69eefcf1decb446f39132b339f80a +size 1142506048 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_M.gguf new file mode 100644 index 0000000..3c5c508 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc718649c15e2106a29dbdca26ea008efa720f5f8bd82c99290310f8ede56f4 +size 1107411520 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_S.gguf new file mode 100644 index 0000000..bca065c --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdfa9e9ff6d85ebff56b7b5fb76d327c1f3ddf1d01137be831637cfc6ab25b6d +size 1060192832 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_M.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_M.gguf new file mode 100644 index 0000000..c8a9bd3 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904523bd3661ca21a23fd3b39f4cedad6df06137b16da0cd5e6c21c1531d27c1 +size 1257882176 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_S.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_S.gguf new file mode 100644 index 0000000..2010565 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:621d027f91192e9a0635148cd3fc2370ea484287d041935befef4362485f2f7c +size 1230586432 diff --git a/Qwen3-1.7B-ShiningValiant3.i1-Q6_K.gguf b/Qwen3-1.7B-ShiningValiant3.i1-Q6_K.gguf new file mode 100644 index 0000000..ec8fd18 --- /dev/null +++ b/Qwen3-1.7B-ShiningValiant3.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d6de3063a21624df3c2fb54e3cb3e2115b1848490dabfd64f4f0d256afabb9 +size 1417757248 diff --git a/README.md b/README.md new file mode 100644 index 0000000..27f3cbf --- /dev/null +++ b/README.md @@ -0,0 +1,139 @@ +--- +base_model: ValiantLabs/Qwen3-1.7B-ShiningValiant3 +datasets: +- sequelbox/Celestia3-DeepSeek-R1-0528 +- sequelbox/Mitakihara-DeepSeek-R1-0528 +- sequelbox/Raiden-DeepSeek-R1 +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- shining-valiant +- shining-valiant-3 +- valiant +- valiant-labs +- qwen +- qwen-3 +- qwen-3-1.7b +- 1.7b +- reasoning +- code +- code-reasoning +- science +- science-reasoning +- physics +- biology +- chemistry +- earth-science +- astronomy +- machine-learning +- artificial-intelligence +- compsci +- computer-science +- information-theory +- ML-Ops +- math +- cuda +- deep-learning +- transformers +- agentic +- LLM +- neuromorphic +- self-improvement +- complex-systems +- cognition +- linguistics +- philosophy +- logic +- epistemology +- simulation +- game-theory +- knowledge-management +- creativity +- problem-solving +- architect +- engineer +- developer +- creative +- analytical +- expert +- rationality +- conversational +- chat +- instruct +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/ValiantLabs/Qwen3-1.7B-ShiningValiant3 + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Qwen3-1.7B-ShiningValiant3-i1-GGUF).*** + +static quants are available at 
https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ1_S.gguf) | i1-IQ1_S | 0.6 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ2_S.gguf) | i1-IQ2_S | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ2_M.gguf) | i1-IQ2_M | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.8 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q2_K.gguf) | i1-Q2_K | 0.9 | IQ3_XXS probably 
better | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ3_S.gguf) | i1-IQ3_S | 1.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ3_M.gguf) | i1-IQ3_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.1 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q4_0.gguf) | i1-Q4_0 | 1.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| 
[GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q4_1.gguf) | i1-Q4_1 | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen3-1.7B-ShiningValiant3-i1-GGUF/resolve/main/Qwen3-1.7B-ShiningValiant3.i1-Q6_K.gguf) | i1-Q6_K | 1.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..73a4b7b --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8136df2b9e9468decf98fee0a2711baa234cd0fd4c38e4cffd1ff100a3d2f7 +size 2070873