From 3a91c332318dc659abfdec1fa6386f04b1defcb8 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 21 Jun 2026 20:11:19 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/MemPrivacy-1.7B-SFT-GGUF Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++ MemPrivacy-1.7B-SFT.IQ4_XS.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q2_K.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q3_K_L.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q3_K_M.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q3_K_S.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q4_K_M.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q4_K_S.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q5_K_M.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q5_K_S.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q6_K.gguf | 3 ++ MemPrivacy-1.7B-SFT.Q8_0.gguf | 3 ++ MemPrivacy-1.7B-SFT.f16.gguf | 3 ++ README.md | 86 +++++++++++++++++++++++++++++++++ 14 files changed, 169 insertions(+) create mode 100644 .gitattributes create mode 100644 MemPrivacy-1.7B-SFT.IQ4_XS.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q2_K.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q3_K_L.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q3_K_M.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q3_K_S.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q4_K_M.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q4_K_S.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q5_K_M.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q5_K_S.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q6_K.gguf create mode 100644 MemPrivacy-1.7B-SFT.Q8_0.gguf create mode 100644 MemPrivacy-1.7B-SFT.f16.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f2a16ef --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text 
+*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text 
+MemPrivacy-1.7B-SFT.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +MemPrivacy-1.7B-SFT.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/MemPrivacy-1.7B-SFT.IQ4_XS.gguf b/MemPrivacy-1.7B-SFT.IQ4_XS.gguf new file mode 100644 index 0000000..5137441 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21b9323de1db6db6468341dd897dbe198b28a0193527307f8a8b754719b95df +size 1016281664 diff --git a/MemPrivacy-1.7B-SFT.Q2_K.gguf b/MemPrivacy-1.7B-SFT.Q2_K.gguf new file mode 100644 index 0000000..ec0d2d4 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f007066f4029be2a2d597e101a26376861ca77eda2b5c36dd2f242d1608542 +size 777796160 diff --git a/MemPrivacy-1.7B-SFT.Q3_K_L.gguf b/MemPrivacy-1.7B-SFT.Q3_K_L.gguf new file mode 100644 index 0000000..861e7f7 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e500687b3ed814eb2018670f62ff29d9df0350ad1f55a9ab72194b0efae00d +size 1003502144 diff --git a/MemPrivacy-1.7B-SFT.Q3_K_M.gguf b/MemPrivacy-1.7B-SFT.Q3_K_M.gguf new file mode 100644 index 0000000..78b16c1 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ea3142bc54c6385d5c199bc424653af37ae1c4cfadca0f77625f783423fca7 +size 939539008 diff --git a/MemPrivacy-1.7B-SFT.Q3_K_S.gguf b/MemPrivacy-1.7B-SFT.Q3_K_S.gguf new file mode 100644 index 0000000..27de3fd --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3caa89c4a45d32e9a5df4c28da3844f70431cc7f56da9dc42a97ef8f5bd0598b +size 867252800 diff --git a/MemPrivacy-1.7B-SFT.Q4_K_M.gguf b/MemPrivacy-1.7B-SFT.Q4_K_M.gguf new file mode 
100644 index 0000000..1606ab2 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48767d34fe205b60d1c475ec7b9ff589c4ab96f28ebb9f6ef91c111cc4666135 +size 1107409472 diff --git a/MemPrivacy-1.7B-SFT.Q4_K_S.gguf b/MemPrivacy-1.7B-SFT.Q4_K_S.gguf new file mode 100644 index 0000000..d795946 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56a0c3550277eb7a51a05461e8e61f52848b7531687c94485ab3ea8892fae7b +size 1060190784 diff --git a/MemPrivacy-1.7B-SFT.Q5_K_M.gguf b/MemPrivacy-1.7B-SFT.Q5_K_M.gguf new file mode 100644 index 0000000..0459207 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e1aa57240700997b0b9fcc54abe30c91b92d31733c04910aaca12c2eae05eb +size 1257880128 diff --git a/MemPrivacy-1.7B-SFT.Q5_K_S.gguf b/MemPrivacy-1.7B-SFT.Q5_K_S.gguf new file mode 100644 index 0000000..b6bfe73 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb4ffbcd97c78c58310088a7efcd3e97347bc8a4f576c308bc22c75de100a83 +size 1230584384 diff --git a/MemPrivacy-1.7B-SFT.Q6_K.gguf b/MemPrivacy-1.7B-SFT.Q6_K.gguf new file mode 100644 index 0000000..8e76292 --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989215f3de3ad50e0cf03c2d65f54c952464ddd7f40bd2a8a270730d1393f701 +size 1417755200 diff --git a/MemPrivacy-1.7B-SFT.Q8_0.gguf b/MemPrivacy-1.7B-SFT.Q8_0.gguf new file mode 100644 index 0000000..618c32a --- /dev/null +++ b/MemPrivacy-1.7B-SFT.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f483e4d7c70938debe166b0d5c64d3bace7b23ce431fd8e2b5103c88d6b5aa8 +size 1834426944 diff --git a/MemPrivacy-1.7B-SFT.f16.gguf b/MemPrivacy-1.7B-SFT.f16.gguf new file mode 100644 index 0000000..81d7c64 --- /dev/null 
+++ b/MemPrivacy-1.7B-SFT.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29061b14ccb1d0f569688b0d122a66eed361af5e504b297dad921f936581250f +size 3447349824 diff --git a/README.md b/README.md new file mode 100644 index 0000000..6277a89 --- /dev/null +++ b/README.md @@ -0,0 +1,86 @@ +--- +arxiv: 2605.09530 +base_model: IAAR-Shanghai/MemPrivacy-1.7B-SFT +language: +- en +- zh +library_name: transformers +license: cc-by-nc-nd-4.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- privacy +- privacy-detection +- memory +- personalized-memory +- memory-system +- memory-management +- agent +- agent-memory +- information-security +- information-extraction +- edge-cloud +--- +## About + + + + + + + + + +static quants of https://huggingface.co/IAAR-Shanghai/MemPrivacy-1.7B-SFT + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#MemPrivacy-1.7B-SFT-GGUF).*** + +weighted/imatrix quants seem not to be available (by me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q2_K.gguf) | Q2_K | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q3_K_S.gguf) | Q3_K_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q3_K_M.gguf) | Q3_K_M | 1.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q3_K_L.gguf) | Q3_K_L | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.IQ4_XS.gguf) | IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q4_K_S.gguf) | Q4_K_S | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q4_K_M.gguf) | Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q5_K_S.gguf) | Q5_K_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q5_K_M.gguf) | Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q6_K.gguf) | Q6_K | 1.5 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.Q8_0.gguf) | Q8_0 | 1.9 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/MemPrivacy-1.7B-SFT-GGUF/resolve/main/MemPrivacy-1.7B-SFT.f16.gguf) | f16 | 3.5 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + 
+![Graph comparing quant types (lower is better)](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and for providing upgrades to my workstation, which +enable this work in my free time. + +