From 1d2141706cc98f30ead07e3cb9fda177226c8f96 Mon Sep 17 00:00:00 2001
From: ModelHub XC <noreply@modelhub.org.cn>
Date: Mon, 22 Jun 2026 05:21:17 +0800
Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?=
 =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?=
 =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Model: DevQuasar-7/nvidia.Nemotron-Mini-4B-Instruct-GGUF
Source: Original Platform
---
 .gitattributes                               | 46 ++++++++++++++++++++
 README.md                                    | 20 +++++++++
 nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf   |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf   |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf   |  3 ++
 nvidia.Nemotron-Mini-4B-Instruct.f16.gguf    |  3 ++
 13 files changed, 99 insertions(+)
 create mode 100644 .gitattributes
 create mode 100644 README.md
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf
 create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.f16.gguf

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..28d1df0
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,46 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.f16.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..2ac609b
--- /dev/null
+++ b/README.md
@@ -0,0 +1,20 @@
+---
+base_model:
+- nvidia/Nemotron-Mini-4B-Instruct
+pipeline_tag: text-generation
+---
+
+[<img src="https://raw.githubusercontent.com/csabakecskemeti/devquasar/main/dq_logo_black-transparent.png" alt="DevQuasar logo" width="200"/>](https://devquasar.com)
+
+Quantized version of: [nvidia/Nemotron-Mini-4B-Instruct](https://huggingface.co/nvidia/Nemotron-Mini-4B-Instruct)
+
+'Make knowledge free for everyone'
+
+<p align="center">
+  Made with <br>
+  <a href="https://www.civo.com/" target="_blank">
+    <img src="https://www.civo.com/assets/public/brand-assets/civo-logo-colour-60cc1622dedf346f7afde1fff760523f731b0aac106a5465af98ff4073114b74.svg" alt="Civo" width="100"/>
+  </a>
+</p>
+
+<a href='https://ko-fi.com/L4L416YX7C' target='_blank'><img height='36' style='border:0px;height:36px;' src='https://storage.ko-fi.com/cdn/kofi6.png?v=6' border='0' alt='Buy Me a Coffee at ko-fi.com' /></a>
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf
new file mode 100644
index 0000000..800da4f
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:51563c7c8054df2dd1891c77f155be7d06b88e24415ef6d3941d33d93a88d490
+size 1902795424
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf
new file mode 100644
index 0000000..d096523
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e23ab1c6101753a373501143602a1451d27fee4adcaf90f9dbfc7968949fbf0c
+size 2452953760
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf
new file mode 100644
index 0000000..dc86164
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fce3ae3d0460dfb877826722173251a0a7ce5694af455b91ecb9facf2517e5d4
+size 2297240224
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf
new file mode 100644
index 0000000..8fd81dd
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ea3f049aea16041b5ced94d34e673812c78ee9266410c8871bc45958c6cae41
+size 2115574432
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf
new file mode 100644
index 0000000..f8c4ccd
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:725856aa1e3f0a1381dc7416e2aaa88fb12221f14d54a529f835b779f4067311
+size 2697386656
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf
new file mode 100644
index 0000000..1327f11
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd00fb19c250c98cd40210af6603d60ba5b5e7d612c31501e0e0802beb575e99
+size 2583354016
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf
new file mode 100644
index 0000000..a37356b
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8526c42527567d1ae1b82b3ffb4a6908774a3e3701bde68d0bec7e603aaa7090
+size 3059931808
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf
new file mode 100644
index 0000000..c4d881c
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2df7ce1e20886eac8a103ad0ab6df09478787e71e553ec9761a49962e85d7c7
+size 2993085088
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf
new file mode 100644
index 0000000..17e5fc9
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e6a922e2e89510ab82bcdb85cde5929e5db245a3eceb09d953dbfd031c83e6a
+size 3445136032
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf
new file mode 100644
index 0000000..45f04f0
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9474cff58734f261077bca9720e4251b13a10ccc2f13efefee44182c8d9dd75a
+size 4459928224
diff --git a/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf b/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf
new file mode 100644
index 0000000..dffcc3c
--- /dev/null
+++ b/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1cbb50185b180012ad842c81eb0da2b8dfd494d52ea38f47addecc7f3deba502
+size 8388156064