commit f86eee3a6d137182e627691b767d7238fd662b04 Author: ModelHub XC Date: Mon May 25 17:24:18 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/TinyV-Qwen3-1.7B-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..25f33f6 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q2_K.gguf filter=lfs 
diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +TinyV-Qwen3-1.7B.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..56dffa6 --- /dev/null +++ b/README.md @@ -0,0 +1,73 @@ +--- +base_model: zhangchenxu/TinyV-Qwen3-1.7B +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- llama-factory +- full +- generated_from_trainer +--- +## About + + + + + + +static quants of https://huggingface.co/zhangchenxu/TinyV-Qwen3-1.7B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#TinyV-Qwen3-1.7B-GGUF).*** + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q2_K.gguf) | Q2_K | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q3_K_S.gguf) | Q3_K_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q3_K_M.gguf) | Q3_K_M | 1.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q3_K_L.gguf) | Q3_K_L | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.IQ4_XS.gguf) | IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q4_K_S.gguf) | Q4_K_S | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q4_K_M.gguf) | Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q5_K_S.gguf) | Q5_K_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q5_K_M.gguf) | Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q6_K.gguf) | Q6_K | 1.5 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.Q8_0.gguf) | Q8_0 | 1.9 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/TinyV-Qwen3-1.7B-GGUF/resolve/main/TinyV-Qwen3-1.7B.f16.gguf) | f16 | 3.5 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on 
the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/TinyV-Qwen3-1.7B.IQ4_XS.gguf b/TinyV-Qwen3-1.7B.IQ4_XS.gguf new file mode 100644 index 0000000..ae4c69d --- /dev/null +++ b/TinyV-Qwen3-1.7B.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff7f4b1141cdb900443e1cc82b9226f8a4561826f8baaf843a08f305cac1025 +size 1016277376 diff --git a/TinyV-Qwen3-1.7B.Q2_K.gguf b/TinyV-Qwen3-1.7B.Q2_K.gguf new file mode 100644 index 0000000..00d8487 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c0b181d886ab0a012c97972e375261ee75d99308be978704e4aa71d7bbfa2b7 +size 777791872 diff --git a/TinyV-Qwen3-1.7B.Q3_K_L.gguf b/TinyV-Qwen3-1.7B.Q3_K_L.gguf new file mode 100644 index 0000000..57fb731 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2ab0714a357c687cb9b2ff0593a20aafd211022fdf50cef8f9a2d4f26ccc9a +size 1003497856 diff --git a/TinyV-Qwen3-1.7B.Q3_K_M.gguf b/TinyV-Qwen3-1.7B.Q3_K_M.gguf new file mode 100644 index 0000000..a29a739 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f9544c09bb0c6316ca39de3923490e92f3e50d3031862df8859d48a154b328 +size 939534720 diff --git a/TinyV-Qwen3-1.7B.Q3_K_S.gguf b/TinyV-Qwen3-1.7B.Q3_K_S.gguf new file mode 100644 index 0000000..abd0f4e --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:c2e4166c1e003e0462731077753e01e90419b995e5b430a8d35a58b747a8739f +size 867248512 diff --git a/TinyV-Qwen3-1.7B.Q4_K_M.gguf b/TinyV-Qwen3-1.7B.Q4_K_M.gguf new file mode 100644 index 0000000..aecc4ba --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7d4362e106bf6ca2f95dcf1bb0d326dccf2a3ff388ab9ba85129c7171ce7c7 +size 1107405184 diff --git a/TinyV-Qwen3-1.7B.Q4_K_S.gguf b/TinyV-Qwen3-1.7B.Q4_K_S.gguf new file mode 100644 index 0000000..f8d0749 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d9a2f562a7a6a7903d2506e7cefab73d0f90a5bfdaa7fe9f9e716d9402ceb4 +size 1060186496 diff --git a/TinyV-Qwen3-1.7B.Q5_K_M.gguf b/TinyV-Qwen3-1.7B.Q5_K_M.gguf new file mode 100644 index 0000000..1b1975e --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0c70d31a74fd4297d58dc326d576c9e6ad16952b83cb68cb9c9535f14a6517 +size 1257875840 diff --git a/TinyV-Qwen3-1.7B.Q5_K_S.gguf b/TinyV-Qwen3-1.7B.Q5_K_S.gguf new file mode 100644 index 0000000..eb9f405 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f505d225b95428a4282d0549afd3f6494063202baf944af3546d90b87030a9f +size 1230580096 diff --git a/TinyV-Qwen3-1.7B.Q6_K.gguf b/TinyV-Qwen3-1.7B.Q6_K.gguf new file mode 100644 index 0000000..ec29d7d --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bddab37e627b300461d093c5c0b72e49ef15208f755964d1e03d8ddc509d1dc +size 1417750912 diff --git a/TinyV-Qwen3-1.7B.Q8_0.gguf b/TinyV-Qwen3-1.7B.Q8_0.gguf new file mode 100644 index 0000000..4c3da39 --- /dev/null +++ b/TinyV-Qwen3-1.7B.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24ffe46e100bfd7e0594f806b107499d8e9448dfb094bc15d22a835809ed499 +size 1834422656 
diff --git a/TinyV-Qwen3-1.7B.f16.gguf b/TinyV-Qwen3-1.7B.f16.gguf new file mode 100644 index 0000000..54a8c35 --- /dev/null +++ b/TinyV-Qwen3-1.7B.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c9662a3fb387acfafdf367ee6d0cb750c652d144ed9de91435ba44e4d86586 +size 3447345536