From 1d2141706cc98f30ead07e3cb9fda177226c8f96 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 22 Jun 2026 05:21:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: DevQuasar-7/nvidia.Nemotron-Mini-4B-Instruct-GGUF Source: Original Platform --- .gitattributes | 46 ++++++++++++++++++++ README.md | 20 +++++++++ nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf | 3 ++ nvidia.Nemotron-Mini-4B-Instruct.f16.gguf | 3 ++ 13 files changed, 99 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf create mode 100644 nvidia.Nemotron-Mini-4B-Instruct.f16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..28d1df0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,46 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.f16.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..2ac609b --- /dev/null +++ b/README.md @@ -0,0 +1,20 @@ +--- +base_model: +- nvidia/Nemotron-Mini-4B-Instruct +pipeline_tag: text-generation +--- + +[](https://devquasar.com) + +Quantized version of: [nvidia/Nemotron-Mini-4B-Instruct](https://huggingface.co/nvidia/Nemotron-Mini-4B-Instruct) + +'Make knowledge free for everyone' + +

+ Made with
+ + + +

+ +Buy Me a Coffee at ko-fi.com diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf new file mode 100644 index 0000000..800da4f --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51563c7c8054df2dd1891c77f155be7d06b88e24415ef6d3941d33d93a88d490 +size 1902795424 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf new file mode 100644 index 0000000..d096523 --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e23ab1c6101753a373501143602a1451d27fee4adcaf90f9dbfc7968949fbf0c +size 2452953760 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf new file mode 100644 index 0000000..dc86164 --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce3ae3d0460dfb877826722173251a0a7ce5694af455b91ecb9facf2517e5d4 +size 2297240224 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf new file mode 100644 index 0000000..8fd81dd --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea3f049aea16041b5ced94d34e673812c78ee9266410c8871bc45958c6cae41 +size 2115574432 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf new file mode 100644 index 0000000..f8c4ccd --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:725856aa1e3f0a1381dc7416e2aaa88fb12221f14d54a529f835b779f4067311 +size 2697386656 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf new file mode 100644 index 0000000..1327f11 --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd00fb19c250c98cd40210af6603d60ba5b5e7d612c31501e0e0802beb575e99 +size 2583354016 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf new file mode 100644 index 0000000..a37356b --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8526c42527567d1ae1b82b3ffb4a6908774a3e3701bde68d0bec7e603aaa7090 +size 3059931808 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf new file mode 100644 index 0000000..c4d881c --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2df7ce1e20886eac8a103ad0ab6df09478787e71e553ec9761a49962e85d7c7 +size 2993085088 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf new file mode 100644 index 0000000..17e5fc9 --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6a922e2e89510ab82bcdb85cde5929e5db245a3eceb09d953dbfd031c83e6a +size 3445136032 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf b/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf new file mode 100644 index 0000000..45f04f0 --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9474cff58734f261077bca9720e4251b13a10ccc2f13efefee44182c8d9dd75a +size 4459928224 diff --git a/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf b/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf new file mode 100644 index 0000000..dffcc3c --- /dev/null +++ b/nvidia.Nemotron-Mini-4B-Instruct.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cbb50185b180012ad842c81eb0da2b8dfd494d52ea38f47addecc7f3deba502 +size 8388156064