From 8ee8041f778ffa70cd3c2ce3ae858b5f5835e758 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 21 May 2026 20:04:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF Source: Original Platform --- .gitattributes | 59 ++++++++++++ ...-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf | 3 + ...-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf | 3 + ...-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf | 3 + ...-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf | 3 + ...pus-High-Reasoning-Distill.i1-IQ2_XXS.gguf | 3 + ...-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf | 3 + ...-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf | 3 + ...pus-High-Reasoning-Distill.i1-IQ3_XXS.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf | 3 + ...5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf | 3 + ...5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf | 3 + ...5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf | 3 + ...Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf | 3 + ...5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf | 3 + ...5-Opus-High-Reasoning-Distill.imatrix.gguf | 3 + README.md | 92 +++++++++++++++++++ 27 files changed, 226 insertions(+) create mode 100644 .gitattributes create mode 100644 
Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf create mode 100644 
Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf create mode 100644 Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..50200bd --- /dev/null +++ b/.gitattributes @@ -0,0 +1,59 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs 
merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf filter=lfs diff=lfs 
merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf new file mode 100644 index 0000000..d2092b2 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f970d75b2c98b2e4135db4279a5382b15971a73b2f96a485cc7c269e79e6c1eb +size 3849657920 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf new file mode 100644 index 0000000..98ba3d9 --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f91404ef61fa8e5cd3c1bd769b6ca338b9c69963a4ed4bcd269ecd3d2fcd18d +size 3579936320 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf new file mode 100644 index 0000000..66f8b6e --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c185ca7ddfa5fab389ffe8dbb416b92cbceeb8a8e5d24365b64aa50bc2f2c7e +size 5322943040 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf new file mode 100644 index 0000000..dec8c43 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e70e58d0da04d85bc3f418c523f06f5b7b1872aa0c6bfcc754f0cc4e3228507 +size 4963314240 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf new file mode 100644 index 0000000..871236a --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce1d0f0080c71f3d4921d1f88bb67a5ffefa6ef4cde110deb7417361094301d +size 4691590720 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..4436ce6 --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98cea862d6b956b44705c27e9c5a0a7d0d729af82883efc5daf486fe3cccb0c9 +size 4299193920 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf new file mode 100644 index 0000000..143cc4f --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a0a0c8d37e91cc2a8f5f361663e3954c81634baf890f98cad70ad97653ee80 +size 6883411520 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf new file mode 100644 index 0000000..abc928e --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b79dc64719f1d8ca1a1336c9b03bab65d609a4990afc4908d8ba1a362decf2be +size 6684960320 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf new file mode 100644 index 0000000..3a33462 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa692b924f44bd403b240994c39bd22165c41d8b86493c1d1dcdc4510790583 +size 6375302720 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..ad0638b --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce14df4d55dfd50ddf13301fab344577b3f70d2664cea7f9bbcffdc4967647a1 +size 5942667840 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf new file mode 100644 index 0000000..3175251 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa67d08c8d64d42148435dbc0b91fb716081898fe43c8cc571b4f59f54d0dc3 +size 8541364800 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf new file mode 100644 index 0000000..148ea79 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44317b29b95388bfc4912aa89942be812a24fcb140a50bf10c4fb1a98c783545 +size 8110731840 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf new file mode 100644 index 0000000..3457608 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384758e8f82a2451669b1fcf78b68372207de1682e64262c1d057057f9040a8e +size 5753985600 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf new file mode 100644 index 0000000..25763de --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82653b8424b472733811e2b450c9e6fe04b7484f7d4b9b8c3fba2b7144d1e792 +size 5389851200 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf new file mode 100644 index 0000000..bce8418 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96df92e8cf72497aeed707122fc9409998a3fb9c4d99420cf25bf3f2c100b921 +size 7900653120 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf new file mode 100644 index 0000000..56b3f76 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236c3420945523b126aaa6116afe5a8c2638701c06b5886d43f2c3a13515957c +size 7321314880 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c8820b8 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d482f749e307e0145f0e287f8533225388cbe46e799c98858894257922702c4 +size 6657107520 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf new file mode 100644 index 0000000..3cdd3bd --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7a134af591a7eb490e4e9384aa98c8a91d6bb297db6339a46ec0e32889fd5f +size 8543003200 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf new file mode 100644 index 0000000..cab3469 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb23a07533e7d112d71b1b47defa70cedeb81af2b994c6bad80014e671bca66 +size 9389523520 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf new file mode 100644 index 0000000..bf2828c --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e6fa8ff6b330780e68c28a11dc460312390d6afbcf9cfec1a26fa1bcdf1ed4 +size 9001755200 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf new file mode 100644 index 0000000..8aff6ea --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c50db3fbce555419695963af6d2b64ac6eb73420cd3c18f292ee8edd04934887 +size 8573477440 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf new file mode 100644 index 0000000..abd3638 --- /dev/null +++ 
b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019f4690c6a55f0f36bf2d4f7896dc4c7329e625ca82fb454548498f1c3ac722 +size 10514571840 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf new file mode 100644 index 0000000..0bfbd75 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a492a4b00370d49ea636c928d65aedfa1472cfd0e3642b91e4eb8e230586e43 +size 10263896640 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf new file mode 100644 index 0000000..c7fa0bc --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0438fb67d61ebf17355eb965473a229194b4bfdd06d887875c883385c30a6bf3 +size 12121939520 diff --git a/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf new file mode 100644 index 0000000..8112e57 --- /dev/null +++ b/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b37d15e6ef27c6da9397421b8fda24bc5b8a18f12a980600e16c7d825ec5e1 +size 7743552 diff --git a/README.md b/README.md new file mode 100644 index 0000000..ba1c7fb --- /dev/null +++ b/README.md @@ -0,0 +1,92 @@ +--- +base_model: TeichAI/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill +datasets: +- TeichAI/claude-4.5-opus-high-reasoning-250x +language: +- en +library_name: 
transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- qwen3 +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/TeichAI/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_S.gguf) | i1-IQ1_S | 3.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ1_M.gguf) | i1-IQ1_M | 3.9 | mostly desperate | +| 
[GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 4.4 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_XS.gguf) | i1-IQ2_XS | 4.8 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_S.gguf) | i1-IQ2_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ2_M.gguf) | i1-IQ2_M | 5.4 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K_S.gguf) | i1-Q2_K_S | 5.5 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q2_K.gguf) | i1-Q2_K | 5.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 6.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_XS.gguf) | i1-IQ3_XS | 6.5 | | +| 
[GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_S.gguf) | i1-Q3_K_S | 6.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_S.gguf) | i1-IQ3_S | 6.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ3_M.gguf) | i1-IQ3_M | 7.0 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_M.gguf) | i1-Q3_K_M | 7.4 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q3_K_L.gguf) | i1-Q3_K_L | 8.0 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_XS.gguf) | i1-IQ4_XS | 8.2 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-IQ4_NL.gguf) | i1-IQ4_NL | 8.6 | prefer IQ4_XS | +| 
[GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_0.gguf) | i1-Q4_0 | 8.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_S.gguf) | i1-Q4_K_S | 8.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_K_M.gguf) | i1-Q4_K_M | 9.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q4_1.gguf) | i1-Q4_1 | 9.5 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_S.gguf) | i1-Q5_K_S | 10.4 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q5_K_M.gguf) | i1-Q5_K_M | 10.6 | | +| [GGUF](https://huggingface.co/mradermacher/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill-i1-GGUF/resolve/main/Nemotron-Cascade-14B-Thinking-Claude-4.5-Opus-High-Reasoning-Distill.i1-Q6_K.gguf) | i1-Q6_K | 12.2 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the 
matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +