From ea18bd31d1d4a84a06d793a65a5e7fd0d51a9ad7 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 17 Jun 2026 15:26:24 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++ README.md | 66 +++++++++++++++++++++++++ TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf | 3 ++ TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf | 3 ++ 14 files changed, 149 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf create mode 100644 TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 
0000000..0afc1de --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs 
-text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..d97d0ab --- /dev/null +++ b/README.md @@ -0,0 +1,66 @@ +--- +base_model: ernie-research/TLDR-Gemma-2B-MA-PPO-Fixed5 +datasets: +- openai/summarize_from_feedback +language: +- en +library_name: transformers +license: mit +quantized_by: mradermacher +--- +## About + + + + + + +Static quants of https://huggingface.co/ernie-research/TLDR-Gemma-2B-MA-PPO-Fixed5 + + +Weighted/imatrix quants do not seem to be available (from me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf) | Q2_K | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf) | Q3_K_S | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf) | Q3_K_M | 1.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf) | Q3_K_L | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf) | IQ4_XS | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf) | Q4_K_S | 1.7 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf) | Q4_K_M | 1.7 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf) | Q5_K_S | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf) | Q5_K_M | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf) | Q6_K | 2.2 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf) | Q8_0 | 2.8 | fast, best quality | +| 
[GGUF](https://huggingface.co/mradermacher/TLDR-Gemma-2B-MA-PPO-Fixed5-GGUF/resolve/main/TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf) | f16 | 5.1 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf new file mode 100644 index 0000000..3da2dbd --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55953bb2d73b32f40c0307dcf160ce16e20c9c218d5007b90645602f44ebcd3d +size 1501219232 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf new file mode 100644 index 0000000..f5464a5 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1578a4f2cbfe9cbcc7e9e0d4746d9f2945e7851fd1c430187b2bb10e70e10b3 +size 1157925280 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf new file mode 100644 index 0000000..445bb40 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f93a5539507c31a3903cdde53d77dd2c8dcf5c3e9e37afc4598a1efd393607 +size 1465592224 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf new file mode 100644 index 
0000000..f8c6933 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2501e0f3d7ed9c818d12d531800560bed3dc897b1ecfa757bcaec4dda7a72d +size 1383803296 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf new file mode 100644 index 0000000..5aaa56b --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8111ca33d263883acfcb9cc27f4895f99593b1205b50358f3cef861ce3e6d20c +size 1287981472 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf new file mode 100644 index 0000000..3dce82f --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e273936b5be355885d66371189d24d5821786b387f75e6e713b6c924faf98b2 +size 1630263712 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf new file mode 100644 index 0000000..93f398e --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5119d1b82999fa2381fc56327a1ce1c78d9326765e4406ae4d379e840b214366 +size 1559841184 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf new file mode 100644 index 0000000..bfb13d9 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94cdb6ae44aac9c39b9ef6ada70e375f18aae4a535ce31d38bcfcd3aec40d51f +size 1839651232 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf new file mode 100644 index 0000000..4ab8c4d --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b254d991dcc75cc307e719e062e5177c0cde0a4d21316e5da8c034641407e7d +size 1798916512 
diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf new file mode 100644 index 0000000..a84f553 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881bdd90a27ca04e4b942e2eb48adbd3c094d9f7071b1d04f912b6eec567ff42 +size 2062125472 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf new file mode 100644 index 0000000..0cf93c5 --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36bf7a79fbc6c13de0def2218e005b136a53cbc83bfd83189735b78ffe670f6 +size 2669070752 diff --git a/TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf b/TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf new file mode 100644 index 0000000..fcfa12e --- /dev/null +++ b/TLDR-Gemma-2B-MA-PPO-Fixed5.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb2955101e642304cc4d1433240622756ed093413919051b346d524fa7424df +size 5018536352