commit c70d87425cb0689fad5b86ab0613aa3c9e523bc0 Author: ModelHub XC Date: Sun Apr 12 19:46:54 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: DevQuasar/nvidia.Llama-3.1-Nemotron-Nano-8B-v1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4ab4b78 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,46 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.f16.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..3021965 --- /dev/null +++ b/README.md @@ -0,0 +1,20 @@ +--- +base_model: +- nvidia/Llama-3.1-Nemotron-Nano-8B-v1 +pipeline_tag: text-generation +--- + +[](https://devquasar.com) + +Quantized version of: [nvidia/Llama-3.1-Nemotron-Nano-8B-v1](https://huggingface.co/nvidia/Llama-3.1-Nemotron-Nano-8B-v1) + +'Make knowledge free for everyone' + +

+ Made with
+ + + +

+ +Buy Me a Coffee at ko-fi.com diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q2_K.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q2_K.gguf new file mode 100644 index 0000000..22b992e --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ad69a0dd7cb44230c668db18fffdfa56b9a64f166e46b039f47d2d68a65eda +size 3179133728 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_L.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_L.gguf new file mode 100644 index 0000000..08dcdd9 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e51884058f734c63c4202c2429b289785ab0bb55112121e0ec23014a1a20527 +size 4321958688 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_M.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_M.gguf new file mode 100644 index 0000000..f0259d0 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b12515f8cde84968f846062ed7f445f5c4b5f70eaeb06fa1acaf08685b25720 +size 4018920224 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_S.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_S.gguf new file mode 100644 index 0000000..30ec526 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e11689f828862339ff7fe70b4adb29e816d1f0c28ba16bf80e9156ddeab4c46 +size 3664501536 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_M.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_M.gguf new file mode 100644 index 0000000..8fa76bd --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4406a891bc37c4c4af8339d5f934f26f6db1db14070e5441a5a88bf29d8fa40 +size 4920736544 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_S.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_S.gguf new file mode 100644 index 0000000..2c9f4c9 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c90d8f1a63b8d985e4ca1002817b56c2e6de537e7fa0abd1fa81e0da0fc628 +size 4692671264 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_M.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_M.gguf new file mode 100644 index 0000000..6c883e2 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31b6bcef837ba1b8bc6e9e680bbb465ee80466a467a7eb1f6458ed6f7b3a75d +size 5732989728 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_S.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_S.gguf new file mode 100644 index 0000000..68e6794 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e93656aaab7d762ac262835d74e98018a8ed7655bfc6890665083ce21393240 +size 5599296288 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q6_K.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q6_K.gguf new file mode 100644 index 0000000..3c45790 --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf99105270f10da919182ee6bd8748e0d3f95d0066458da716a6620a1c307c3 +size 6596008736 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q8_0.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q8_0.gguf new file mode 100644 index 0000000..be7c96b --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e341354949756ba20fd402be0764f4bf75f0833fcdcd6ade5b583df998c8214e +size 8540773152 diff --git a/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.f16.gguf b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.f16.gguf new file mode 100644 index 0000000..71ffeee --- /dev/null +++ b/nvidia.Llama-3.1-Nemotron-Nano-8B-v1.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7d697ad1d5ba747bd108d2c398ffd87960d2988906b1ad7c1e106a5b49810d +size 16068893472