commit faccad5dfca185605db0e14e5323dcd8a5bc30a3 Author: ModelHub XC Date: Wed Apr 22 05:53:00 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..ed504f0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text 
+Barcenas-Nemotron-Qwen3-4B-Instruct.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Barcenas-Nemotron-Qwen3-4B-Instruct.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.IQ4_XS.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.IQ4_XS.gguf new file mode 100644 index 0000000..ad8854d --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a02940620a7c648bb92862207cfab400e60c2dfeb10b315ab91231933a50f83 +size 2286315744 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q2_K.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q2_K.gguf new file mode 100644 index 0000000..f91a0e4 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50fb0bda1ecaeb5b6057b9dcca3516bb2a7d1bd6bc55fb00b476816ce31fbe3 +size 1669499104 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_L.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_L.gguf new file mode 100644 index 0000000..73efb35 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:dbbd7160d6769fe82a40bce7f2a2422f509ce160d73d52307528a95053134bfe +size 2239785184 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_M.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_M.gguf new file mode 100644 index 0000000..a83d594 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ada4aaa0f75506ed59c8b9567b7b3221d617cb5dea3a1dd103d816816d5e36b +size 2075617504 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_S.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_S.gguf new file mode 100644 index 0000000..c3ae286 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45aaed172fc530a93c717a4c0b128762850b0657372151130162175f84d32014 +size 1886996704 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_M.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_M.gguf new file mode 100644 index 0000000..d555318 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1e8fad30a566c5a4a35ea0961da9a765282ecfc30c8737711e2a6728d806a8 +size 2497280224 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_S.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_S.gguf new file mode 100644 index 0000000..72929bc --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6fbd900ca2f1aeaa27f4af27200c9983197ae189dc98191720220efc50bb19 +size 2383309024 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_M.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_M.gguf new file mode 100644 index 0000000..10063a1 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0066e88149a7d07e3609400f0c64bba4352755e148496e8e92475ec35fb4ee +size 2889513184 diff --git 
a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_S.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_S.gguf new file mode 100644 index 0000000..88fbe62 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f719f1ced5b664c90273dae15634d86dde4d9101c26b827b543ff19fecd672d +size 2823710944 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q6_K.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q6_K.gguf new file mode 100644 index 0000000..fd85eb0 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b832497358da47e7c9b0274b2b2f0e2548ecd6fd1916f76c004d774d3dbb04f4 +size 3306260704 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.Q8_0.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q8_0.gguf new file mode 100644 index 0000000..ea43e31 --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce87d66758246f1bd22dac66585a9536028d6d79ea56d3b088b4060fef7d115d +size 4280404704 diff --git a/Barcenas-Nemotron-Qwen3-4B-Instruct.f16.gguf b/Barcenas-Nemotron-Qwen3-4B-Instruct.f16.gguf new file mode 100644 index 0000000..774cc8a --- /dev/null +++ b/Barcenas-Nemotron-Qwen3-4B-Instruct.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d2dda0e6697c41bbb7ba5dd378c3f97b8f3e36a288c90ea7614a686236c577 +size 8051284704 diff --git a/README.md b/README.md new file mode 100644 index 0000000..2fc3aca --- /dev/null +++ b/README.md @@ -0,0 +1,74 @@ +--- +base_model: Danielbrdz/Barcenas-Nemotron-Qwen3-4B-Instruct +datasets: +- nvidia/Nemotron-Instruction-Following-Chat-v1 +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +--- +## About + + + + + + + + + +static quants of https://huggingface.co/Danielbrdz/Barcenas-Nemotron-Qwen3-4B-Instruct + + + +***For a convenient 
overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF).*** + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q2_K.gguf) | Q2_K | 1.8 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_S.gguf) | Q3_K_S | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_M.gguf) | Q3_K_M | 2.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q3_K_L.gguf) | Q3_K_L | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.IQ4_XS.gguf) | IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_S.gguf) | Q4_K_S | 2.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q4_K_M.gguf) | Q4_K_M | 2.6 | fast, recommended | +| 
[GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_S.gguf) | Q5_K_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q5_K_M.gguf) | Q5_K_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q6_K.gguf) | Q6_K | 3.4 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.Q8_0.gguf) | Q8_0 | 4.4 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/Barcenas-Nemotron-Qwen3-4B-Instruct-GGUF/resolve/main/Barcenas-Nemotron-Qwen3-4B-Instruct.f16.gguf) | f16 | 8.2 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +