初始化项目,由ModelHub XC社区提供模型
Model: mradermacher/Qwen2-1.5B-GGUF Source: Original Platform
This commit is contained in:
62
.gitattributes
vendored
Normal file
62
.gitattributes
vendored
Normal file
@@ -0,0 +1,62 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.f16.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Qwen2-1.5B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
qwen2-1.5b.f16.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
Qwen2-1.5B.IQ3_M.gguf
Normal file
3
Qwen2-1.5B.IQ3_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:31cca7d1258598c575ab0fe416e84d84b74ae6e63b53817834efb4c463816fbb
|
||||
size 776661504
|
||||
3
Qwen2-1.5B.IQ3_S.gguf
Normal file
3
Qwen2-1.5B.IQ3_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:beb55f90e72c198ff5c7834061d9c797343470ef5f613bf0c1ec1599990455a8
|
||||
size 762404352
|
||||
3
Qwen2-1.5B.IQ3_XS.gguf
Normal file
3
Qwen2-1.5B.IQ3_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5eda20b723178f408076de5598cac365758e4499c07f825d8d6c6dce609098d5
|
||||
size 731696640
|
||||
3
Qwen2-1.5B.IQ4_XS.gguf
Normal file
3
Qwen2-1.5B.IQ4_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:6dfe5ec0937d81353e9186c49395ba317b7a742842a44883dc949ff3e7be0eeb
|
||||
size 902180352
|
||||
3
Qwen2-1.5B.Q2_K.gguf
Normal file
3
Qwen2-1.5B.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5781f0a40005f7c6d38847fca51d63b20675dfe96ad5bc255480a9b91c9003e0
|
||||
size 676302336
|
||||
3
Qwen2-1.5B.Q3_K_L.gguf
Normal file
3
Qwen2-1.5B.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:03bad7381fc9b1d8453e4fcd8a2bbcc372841dc9a13a40e90728e7047ec118d4
|
||||
size 880160256
|
||||
3
Qwen2-1.5B.Q3_K_M.gguf
Normal file
3
Qwen2-1.5B.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:bcc4770dbd3cc5d8d34e7e5f59c607071e022da02a565a2f67d63b787cb7eaa0
|
||||
size 824176128
|
||||
3
Qwen2-1.5B.Q3_K_S.gguf
Normal file
3
Qwen2-1.5B.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:12f6e1c90771c059c34638ebb5e183f76be343633ba786529ec2b28f90c2bc3c
|
||||
size 760942080
|
||||
3
Qwen2-1.5B.Q4_K_M.gguf
Normal file
3
Qwen2-1.5B.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:65bbaf292ba66050e4b08e991c54b22abb544434efbb8bfa7d838d9ac2840d34
|
||||
size 986045952
|
||||
3
Qwen2-1.5B.Q4_K_S.gguf
Normal file
3
Qwen2-1.5B.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:66dc5e782ff14f1418487a940c272715abad817abc0c68634569526ea6b67e8c
|
||||
size 940310016
|
||||
3
Qwen2-1.5B.Q5_K_M.gguf
Normal file
3
Qwen2-1.5B.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3ad67a227879b4c648a41b49cc986e0fd20fbcc672e08627e7cd7bc594a9c128
|
||||
size 1125047808
|
||||
3
Qwen2-1.5B.Q5_K_S.gguf
Normal file
3
Qwen2-1.5B.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:10858645a9baac8cbf120f320f3f63addaa3db0bb1588a48d5919d7334212523
|
||||
size 1098726912
|
||||
3
Qwen2-1.5B.Q6_K.gguf
Normal file
3
Qwen2-1.5B.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5179e0418e592515287dbd88546ab8022a8a544918cd13af0174f835c3b9abf9
|
||||
size 1272737280
|
||||
3
Qwen2-1.5B.Q8_0.gguf
Normal file
3
Qwen2-1.5B.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:516151168017cfdf4a9d9481d01e9ebd1b6029f83c10f03f0a7fab16d87321bc
|
||||
size 1646570496
|
||||
3
Qwen2-1.5B.f16.gguf
Normal file
3
Qwen2-1.5B.f16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9223c65c748b43d1a4a3595e7068c052d34b2c13555cb01d6b50857c400a438b
|
||||
size 3093666816
|
||||
69
README.md
Normal file
69
README.md
Normal file
@@ -0,0 +1,69 @@
|
||||
---
|
||||
base_model: Qwen/Qwen2-1.5B
|
||||
language:
|
||||
- en
|
||||
library_name: transformers
|
||||
license: apache-2.0
|
||||
quantized_by: mradermacher
|
||||
tags:
|
||||
- pretrained
|
||||
---
|
||||
## About
|
||||
|
||||
<!-- ### quantize_version: 2 -->
|
||||
<!-- ### output_tensor_quantised: 1 -->
|
||||
<!-- ### convert_type: hf -->
|
||||
<!-- ### vocab_type: -->
|
||||
<!-- ### tags: -->
|
||||
static quants of https://huggingface.co/Qwen/Qwen2-1.5B
|
||||
|
||||
<!-- provided-files -->
|
||||
weighted/imatrix quants are available at https://huggingface.co/mradermacher/Qwen2-1.5B-i1-GGUF
|
||||
## Usage
|
||||
|
||||
If you are unsure how to use GGUF files, refer to one of [TheBloke's
|
||||
READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for
|
||||
more details, including how to concatenate multi-part files.
|
||||
|
||||
## Provided Quants
|
||||
|
||||
(sorted by size, not necessarily by quality; IQ-quants are often preferable to similarly sized non-IQ quants)
|
||||
|
||||
| Link | Type | Size/GB | Notes |
|
||||
|:-----|:-----|--------:|:------|
|
||||
| [GGUF](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.IQ3_XS.gguf) | IQ3_XS | 0.8 | |
|
||||
| [GGUF](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.IQ3_S.gguf) | IQ3_S | 0.9 | beats Q3_K* |
|
||||
| [GGUF](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.IQ3_M.gguf) | IQ3_M | 0.9 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q2_K.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q2_K.gguf) | Q2_K | 1.5 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q3_K_S.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q3_K_S.gguf) | Q3_K_S | 1.6 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q3_K_M.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q3_K_M.gguf) | Q3_K_M | 1.7 | lower quality |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q3_K_L.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q3_K_L.gguf) | Q3_K_L | 1.9 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.IQ4_XS.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.IQ4_XS.gguf) | IQ4_XS | 1.9 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q4_K_S.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q4_K_S.gguf) | Q4_K_S | 2.0 | fast, recommended |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q4_K_M.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q4_K_M.gguf) | Q4_K_M | 2.1 | fast, recommended |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q5_K_S.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q5_K_S.gguf) | Q5_K_S | 2.3 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q5_K_M.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q5_K_M.gguf) | Q5_K_M | 2.3 | |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q6_K.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q6_K.gguf) | Q6_K | 2.6 | very good quality |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.Q8_0.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.Q8_0.gguf) | Q8_0 | 3.4 | fast, best quality |
|
||||
| [PART 1](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/Qwen2-1.5B.f16.gguf) [PART 2](https://huggingface.co/mradermacher/Qwen2-1.5B-GGUF/resolve/main/qwen2-1.5b.f16.gguf) | f16 | 6.3 | 16 bpw, overkill |
|
||||
|
||||
Here is a handy graph by ikawrakow comparing some lower-quality quant
|
||||
types (lower is better):
|
||||
|
||||
![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png)
|
||||
|
||||
And here are Artefact2's thoughts on the matter:
|
||||
https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9
|
||||
|
||||
## FAQ / Model Request
|
||||
|
||||
See https://huggingface.co/mradermacher/model_requests for some answers to
|
||||
questions you might have and/or if you want some other model quantized.
|
||||
|
||||
## Thanks
|
||||
|
||||
I thank my company, [nethype GmbH](https://www.nethype.de/), for letting
|
||||
me use its servers and providing upgrades to my workstation to enable
|
||||
this work in my free time.
|
||||
|
||||
<!-- end -->
|
||||
3
qwen2-1.5b.IQ4_XS.gguf
Normal file
3
qwen2-1.5b.IQ4_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:01803de70931d2295641824c7a0d9585808e93885f3cb0423fcc6d7c8e4f61bc
|
||||
size 901808512
|
||||
3
qwen2-1.5b.Q2_K.gguf
Normal file
3
qwen2-1.5b.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:61fa61b3ad6f8a972793dd39c989c048a8b6a922cb4b616dcb59326630949b34
|
||||
size 675930496
|
||||
3
qwen2-1.5b.Q3_K_L.gguf
Normal file
3
qwen2-1.5b.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:26e298609badb56edd08ab0f1319dfa63d15e77ef4431658c98d43d4d63c904f
|
||||
size 879788416
|
||||
3
qwen2-1.5b.Q3_K_M.gguf
Normal file
3
qwen2-1.5b.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1fd9cfcc248b0f2e91a3a18d9e3e2fc9b245f53ef6f2a3b00582db16ff5a50fe
|
||||
size 823804288
|
||||
3
qwen2-1.5b.Q3_K_S.gguf
Normal file
3
qwen2-1.5b.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7a8a4b9cf65e72c464b46388490512901d50c1d687e4ed0e6bed85b9a4ff6ea8
|
||||
size 760570240
|
||||
3
qwen2-1.5b.Q4_K_M.gguf
Normal file
3
qwen2-1.5b.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7dd7fa5547557f8577fc42f52bbd8add9bb59f480aa2f488e437e0b23ceae5e3
|
||||
size 985674112
|
||||
3
qwen2-1.5b.Q4_K_S.gguf
Normal file
3
qwen2-1.5b.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ce47cbc2a649f675092aeb1e6f2f470c0fa89817da6bc440e319183ce6e06970
|
||||
size 939938176
|
||||
3
qwen2-1.5b.Q5_K_M.gguf
Normal file
3
qwen2-1.5b.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:fffdb240a63df3636711aad33538323c715f21617a7c058135bbc388e1e050bd
|
||||
size 1124675968
|
||||
3
qwen2-1.5b.Q5_K_S.gguf
Normal file
3
qwen2-1.5b.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8a0e4aa00093628556f1a459a95c9f266abbd98f2780574eb67ec12a5f31379f
|
||||
size 1098355072
|
||||
3
qwen2-1.5b.Q6_K.gguf
Normal file
3
qwen2-1.5b.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:59f15b6694348081744d66fd3731ba775ef268149852b3be6155f723a3f89812
|
||||
size 1272365440
|
||||
3
qwen2-1.5b.Q8_0.gguf
Normal file
3
qwen2-1.5b.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:aba57facc869eaa2e24df72de60d2220b18cb79bb628ea0820391c6803fbd9ba
|
||||
size 1646090752
|
||||
3
qwen2-1.5b.f16.gguf
Normal file
3
qwen2-1.5b.f16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:fc10e6701b34eaafc6b4d348b9d94a0e43a95b3dbdeef26fc137d07412f79e57
|
||||
size 3092769472
|
||||
Reference in New Issue
Block a user