commit 07c747b81bedd9628b7c34f834074b3a4356d0d2 Author: ModelHub XC Date: Sat May 9 05:07:56 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/phi4-reasoning-supervisor-v1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..0000cc8 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,46 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text 
+phi4-reasoning-supervisor-v1.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +phi4-reasoning-supervisor-v1.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..33325ee --- /dev/null +++ b/README.md @@ -0,0 +1,76 @@ +--- +base_model: shareit/phi4-reasoning-supervisor-v1 +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- phi3 +--- +## About + + + + + + + + + +Static quants of https://huggingface.co/shareit/phi4-reasoning-supervisor-v1 + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#phi4-reasoning-supervisor-v1-GGUF).*** + +Weighted/imatrix quants do not seem to be available (from me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q2_K.gguf) | Q2_K | 6.0 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q3_K_S.gguf) | Q3_K_S | 6.6 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q3_K_M.gguf) | Q3_K_M | 7.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q3_K_L.gguf) | Q3_K_L | 8.2 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.IQ4_XS.gguf) | IQ4_XS | 8.4 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q4_K_S.gguf) | Q4_K_S | 8.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q4_K_M.gguf) | Q4_K_M | 9.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q5_K_S.gguf) | Q5_K_S | 10.3 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q5_K_M.gguf) | Q5_K_M | 10.6 | | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q6_K.gguf) | Q6_K | 12.1 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/phi4-reasoning-supervisor-v1-GGUF/resolve/main/phi4-reasoning-supervisor-v1.Q8_0.gguf) | Q8_0 | 15.7 | fast, best quality | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is 
better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/phi4-reasoning-supervisor-v1.IQ4_XS.gguf b/phi4-reasoning-supervisor-v1.IQ4_XS.gguf new file mode 100644 index 0000000..da4bf75 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ed9f0976cec92d97fbe1784a50d389d5bb13a26a955c8e4e3489f9dcf28c1b +size 8258818912 diff --git a/phi4-reasoning-supervisor-v1.Q2_K.gguf b/phi4-reasoning-supervisor-v1.Q2_K.gguf new file mode 100644 index 0000000..335e325 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4e0518e813d1ebed53d7cc38ceb4321737606937f420569380b9c4618036bf +size 5915988832 diff --git a/phi4-reasoning-supervisor-v1.Q3_K_L.gguf b/phi4-reasoning-supervisor-v1.Q3_K_L.gguf new file mode 100644 index 0000000..88f5965 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f08a2e6af833576cfc61ea3e86451410ae042168b4dcd715e5331621e7ccf3 +size 8126763872 diff --git a/phi4-reasoning-supervisor-v1.Q3_K_M.gguf b/phi4-reasoning-supervisor-v1.Q3_K_M.gguf new file mode 100644 index 0000000..145d605 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5869f7d3a9dfa06ad81cb3bdfc848fbd33f635b22b6225df54b4c5dbba2c0fbc +size 7373099872 diff 
--git a/phi4-reasoning-supervisor-v1.Q3_K_S.gguf b/phi4-reasoning-supervisor-v1.Q3_K_S.gguf new file mode 100644 index 0000000..d09e8c2 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450ec1323f6f8b4fc41501692ca58b942a15551a8ff29b491d7cd18f4b3db1a8 +size 6504747872 diff --git a/phi4-reasoning-supervisor-v1.Q4_K_M.gguf b/phi4-reasoning-supervisor-v1.Q4_K_M.gguf new file mode 100644 index 0000000..1d7bd3d --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:231c57dd50524fd7fea5488f483cd19737e897639211ff781a2609bf844133c4 +size 9059259232 diff --git a/phi4-reasoning-supervisor-v1.Q4_K_S.gguf b/phi4-reasoning-supervisor-v1.Q4_K_S.gguf new file mode 100644 index 0000000..b96c94b --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73303fd6b42ec3c617fab5f41da7e728c612f3ad9b859417500736ecd25e0ed1 +size 8460424032 diff --git a/phi4-reasoning-supervisor-v1.Q5_K_M.gguf b/phi4-reasoning-supervisor-v1.Q5_K_M.gguf new file mode 100644 index 0000000..2144782 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57ec0df281436f55f919064b2725257dd4897d8c9d78ae3111ad4a820499933 +size 10499740512 diff --git a/phi4-reasoning-supervisor-v1.Q5_K_S.gguf b/phi4-reasoning-supervisor-v1.Q5_K_S.gguf new file mode 100644 index 0000000..1617469 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178465b94557e4d5670314196e613c5f7e3b60e5a1915a23c32d42f1d28605b0 +size 10151580512 diff --git a/phi4-reasoning-supervisor-v1.Q6_K.gguf b/phi4-reasoning-supervisor-v1.Q6_K.gguf new file mode 100644 index 0000000..d6f5176 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q6_K.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:dd5455d8da5d310753563b8bffcbc9f18a1a7cb510518108763787af990e02a8 +size 12030251872 diff --git a/phi4-reasoning-supervisor-v1.Q8_0.gguf b/phi4-reasoning-supervisor-v1.Q8_0.gguf new file mode 100644 index 0000000..4ca72d2 --- /dev/null +++ b/phi4-reasoning-supervisor-v1.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7e8655ca989ff8be4f38ffe8f2f362290816602d7508e0df3546b75dd14a5c +size 15580500832