commit 74a0130da4fbb02b681b63a8c15f43eaf585cf8a Author: ModelHub XC Date: Sat May 9 20:14:15 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..76d037f --- /dev/null +++ b/.gitattributes @@ -0,0 +1,58 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q2_K.gguf filter=lfs 
diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +BgGPT-7B-Instruct-v0.1.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ1_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ1_M.gguf new file mode 100644 index 0000000..b6a54b7 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd53e6e94957c8cf08eab31ed4bf0028cd1b73b902e060c3722b87b6cb6fe3fe +size 1779580320 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ1_S.gguf 
b/BgGPT-7B-Instruct-v0.1.i1-IQ1_S.gguf new file mode 100644 index 0000000..ee11341 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20cff7f98ec11ff0d0311246a466a7dbe3e450a1b56143c0fae46aa158277a5 +size 1637236128 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ2_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ2_M.gguf new file mode 100644 index 0000000..45fae3a --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb2e65f242aef8e3750f31f474a00c54482ad5d47271818ca81a49ee6354c06d +size 2528342944 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ2_S.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ2_S.gguf new file mode 100644 index 0000000..40f56ac --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ae550e4fbdc09a5b5e94801459884461ba0acfd0fb510dec76437dae9f8bbf +size 2338550688 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ2_XS.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ2_XS.gguf new file mode 100644 index 0000000..f824a5e --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d7b51fdf544bd748322ae847f749b5a498e45319c1308eaf13ae095afbd67a +size 2223390112 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ2_XXS.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..b087855 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053f30328b439db0d11620121955a28abab30e35cdba5fd8e36b5709f6c1ba54 +size 2016820640 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ3_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ3_M.gguf new file mode 100644 index 0000000..a834bfd --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:50ed107718df69270e6841cd750d6ed09bb70ff89b76cbc03a15d3448a1637cd +size 3315786144 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ3_S.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ3_S.gguf new file mode 100644 index 0000000..76ce54f --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9a4386ece3f5a1f57e94adcd3d375ff20811026b6911a7bd63fbafd27c3459 +size 3213287840 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ3_XS.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ3_XS.gguf new file mode 100644 index 0000000..bef170b --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327b5aefeaf41c05300d6bc48cfeb7dd42f22f83af2b5e944ff641563ec9b503 +size 3049709984 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ3_XXS.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..1d6b7d2 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6e8c1faf7ae9eb58977536c2614d4879104f6c373fd4600f0739835e81354f +size 2854974368 diff --git a/BgGPT-7B-Instruct-v0.1.i1-IQ4_XS.gguf b/BgGPT-7B-Instruct-v0.1.i1-IQ4_XS.gguf new file mode 100644 index 0000000..8de6f56 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4601cfc094b6950b51536472bda33a6c887bd6fca6b1fae7a132257839092fc0 +size 3941078944 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q2_K.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q2_K.gguf new file mode 100644 index 0000000..92593a0 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ef18a06b17069c60bf9af59d5eedab9ff49dc8b97f9692528047b7ec43c469 +size 2747640736 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q2_K_S.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q2_K_S.gguf new file mode 100644 index 0000000..f1820e3 --- /dev/null +++ 
b/BgGPT-7B-Instruct-v0.1.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fafbeda636de1fc49965aa081f19e2991818b9b0c708ae062f62ca745e1d0ca +size 2557324192 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q3_K_L.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_L.gguf new file mode 100644 index 0000000..a8851e0 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448fe400362819f954bbe673ffdb06f10e93abf0e2eea32aaa723d1d39fbd09b +size 3852919200 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q3_K_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a1487fb --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf05d5ac073451cfee7901611e8e8cae130cfe164855352331ee0560abc0fee5 +size 3549880736 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q3_K_S.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_S.gguf new file mode 100644 index 0000000..f41273e --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a779e2da0c352feb971b5cb434819d2f8c55c66c155ea4a0b9c0580b137c3bfc +size 3195462048 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q4_0.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q4_0.gguf new file mode 100644 index 0000000..9df9283 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6261b9af71bfa93edfbc57c82f44f080928c1634bb74e034fb03ced709184c9f +size 4157755296 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q4_K_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q4_K_M.gguf new file mode 100644 index 0000000..b286674 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107f8dabb56d27c9954de99d73f7480af415946a69434a6425e0bb38bfff8971 +size 4402597792 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q4_K_S.gguf 
b/BgGPT-7B-Instruct-v0.1.i1-Q4_K_S.gguf new file mode 100644 index 0000000..ea39c39 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b358c97effd8290b695e0e505efeeb3bd18a24ce1f7fb32ff15c11de769ab9 +size 4174532512 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q5_K_M.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q5_K_M.gguf new file mode 100644 index 0000000..938f6c7 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c5cd39c92f4093bfeb5089fd559a6c160ec8cb9e2a97403513390b14244347 +size 5168639904 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q5_K_S.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q5_K_S.gguf new file mode 100644 index 0000000..63c57bf --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ca8fed442640f99f789e417c4dc9d64b2e34075e1b7e862423320f8aaf9e80 +size 5034946464 diff --git a/BgGPT-7B-Instruct-v0.1.i1-Q6_K.gguf b/BgGPT-7B-Instruct-v0.1.i1-Q6_K.gguf new file mode 100644 index 0000000..8094635 --- /dev/null +++ b/BgGPT-7B-Instruct-v0.1.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45131500a0b4f9c9eb6dc6be688bc528b211095dfe09fde16f142164261ebe1e +size 5982559648 diff --git a/README.md b/README.md new file mode 100644 index 0000000..48b03a4 --- /dev/null +++ b/README.md @@ -0,0 +1,79 @@ +--- +base_model: INSAIT-Institute/BgGPT-7B-Instruct-v0.1 +language: +- bg +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- mistral +- instruct +- bggpt +- insait +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/INSAIT-Institute/BgGPT-7B-Instruct-v0.1 + + +static quants are available at https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ1_S.gguf) | i1-IQ1_S | 1.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ1_M.gguf) | i1-IQ1_M | 1.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ2_S.gguf) | i1-IQ2_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ2_M.gguf) | i1-IQ2_M | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q2_K_S.gguf) | i1-Q2_K_S | 2.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q2_K.gguf) | i1-Q2_K | 2.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.1 | | +| 
[GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.3 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ3_S.gguf) | i1-IQ3_S | 3.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ3_M.gguf) | i1-IQ3_M | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.0 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q4_0.gguf) | i1-Q4_0 | 4.3 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.3 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.3 | | +| [GGUF](https://huggingface.co/mradermacher/BgGPT-7B-Instruct-v0.1-i1-GGUF/resolve/main/BgGPT-7B-Instruct-v0.1.i1-Q6_K.gguf) | i1-Q6_K | 6.1 | practically like static Q6_K | + +Here is a handy graph by 
ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..63dc03c --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c512d5bd975cf003c8a51635819e5451ee547ea4f53cbf286303a9f7d0db5d29 +size 4988157