From 04aff2c528129b40e4b292b40720019b26f0f818 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 7 May 2026 06:42:18 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mmnga-o/llm-jp-4-8b-thinking-gguf Source: Original Platform --- .gitattributes | 49 +++++++++++++++++++++++++++++ README.md | 27 ++++++++++++++++ llm-jp-4-8b-thinking-IQ3_M.gguf | 3 ++ llm-jp-4-8b-thinking-IQ4_NL.gguf | 3 ++ llm-jp-4-8b-thinking-IQ4_XS.gguf | 3 ++ llm-jp-4-8b-thinking-MXFP4_MOE.gguf | 3 ++ llm-jp-4-8b-thinking-Q3_K_L.gguf | 3 ++ llm-jp-4-8b-thinking-Q3_K_M.gguf | 3 ++ llm-jp-4-8b-thinking-Q4_0.gguf | 3 ++ llm-jp-4-8b-thinking-Q4_K_M.gguf | 3 ++ llm-jp-4-8b-thinking-Q4_K_S.gguf | 3 ++ llm-jp-4-8b-thinking-Q5_0.gguf | 3 ++ llm-jp-4-8b-thinking-Q5_K_M.gguf | 3 ++ llm-jp-4-8b-thinking-Q5_K_S.gguf | 3 ++ llm-jp-4-8b-thinking-Q6_K.gguf | 3 ++ llm-jp-4-8b-thinking-Q8_0.gguf | 3 ++ 16 files changed, 118 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 llm-jp-4-8b-thinking-IQ3_M.gguf create mode 100644 llm-jp-4-8b-thinking-IQ4_NL.gguf create mode 100644 llm-jp-4-8b-thinking-IQ4_XS.gguf create mode 100644 llm-jp-4-8b-thinking-MXFP4_MOE.gguf create mode 100644 llm-jp-4-8b-thinking-Q3_K_L.gguf create mode 100644 llm-jp-4-8b-thinking-Q3_K_M.gguf create mode 100644 llm-jp-4-8b-thinking-Q4_0.gguf create mode 100644 llm-jp-4-8b-thinking-Q4_K_M.gguf create mode 100644 llm-jp-4-8b-thinking-Q4_K_S.gguf create mode 100644 llm-jp-4-8b-thinking-Q5_0.gguf create mode 100644 llm-jp-4-8b-thinking-Q5_K_M.gguf create mode 100644 llm-jp-4-8b-thinking-Q5_K_S.gguf create mode 100644 llm-jp-4-8b-thinking-Q6_K.gguf create mode 100644 llm-jp-4-8b-thinking-Q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 
index 0000000..d6284da --- /dev/null +++ b/.gitattributes @@ -0,0 +1,49 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-MXFP4_MOE.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text 
+llm-jp-4-8b-thinking-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +llm-jp-4-8b-thinking-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..478f32c --- /dev/null +++ b/README.md @@ -0,0 +1,27 @@ + +--- +license: apache-2.0 +language: +- ja +datasets: +- TFMC/imatrix-dataset-for-japanese-llm +base_model: +- llm-jp/llm-jp-4-8b-thinking +--- + +# llm-jp-4-8b-thinking-gguf +[llm-jpさんが公開しているllm-jp-4-8b-thinking](https://huggingface.co/llm-jp/llm-jp-4-8b-thinking)のggufフォーマット変換版です。 + +imatrixのデータは[TFMC/imatrix-dataset-for-japanese-llm](https://huggingface.co/datasets/TFMC/imatrix-dataset-for-japanese-llm)を使用して作成しました。 + +動作用にchat-templateをカスタマイズしていますので、実際の元モデルのchat-templateと異なる点にご注意ください。 + +## Usage + +``` +git clone https://github.com/ggml-org/llama.cpp.git +cd llama.cpp +cmake -B build -DGGML_CUDA=ON +cmake --build build --config Release +build/bin/llama-cli -m 'llm-jp-4-8b-thinking-Q4_K_M.gguf' -n 128 -c 128 -p 'あなたはプロの料理人です。レシピを教えて' -rea on +``` diff --git a/llm-jp-4-8b-thinking-IQ3_M.gguf b/llm-jp-4-8b-thinking-IQ3_M.gguf new file mode 100644 index 0000000..21dc155 --- /dev/null +++ b/llm-jp-4-8b-thinking-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13bf29e5191d5ba61eb3c1f9c5a071228ed71f21331978318536674c83f4349f +size 4131787840 diff --git a/llm-jp-4-8b-thinking-IQ4_NL.gguf b/llm-jp-4-8b-thinking-IQ4_NL.gguf new file mode 100644 index 0000000..a424505 --- /dev/null +++ 
b/llm-jp-4-8b-thinking-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c781c132a3dafb7300f80ec2fbf27c4d227164cb49b22ab95d0b3e45fc0c7e7 +size 5062136896 diff --git a/llm-jp-4-8b-thinking-IQ4_XS.gguf b/llm-jp-4-8b-thinking-IQ4_XS.gguf new file mode 100644 index 0000000..e98d8b2 --- /dev/null +++ b/llm-jp-4-8b-thinking-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4613e97342612dfe587300042a2b3242c6465e18ff61e33a24df75b7deee112d +size 4823061568 diff --git a/llm-jp-4-8b-thinking-MXFP4_MOE.gguf b/llm-jp-4-8b-thinking-MXFP4_MOE.gguf new file mode 100644 index 0000000..d24382e --- /dev/null +++ b/llm-jp-4-8b-thinking-MXFP4_MOE.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5293041cdca71b98dda2a7c746827e8bf0347d311bcd180ac5b4b231c53288d3 +size 9132708672 diff --git a/llm-jp-4-8b-thinking-Q3_K_L.gguf b/llm-jp-4-8b-thinking-Q3_K_L.gguf new file mode 100644 index 0000000..bcf08fd --- /dev/null +++ b/llm-jp-4-8b-thinking-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ce2a37c33d748124dc9a8499afa15e603c82b591f9148484db2fd50647f099 +size 4668920640 diff --git a/llm-jp-4-8b-thinking-Q3_K_M.gguf b/llm-jp-4-8b-thinking-Q3_K_M.gguf new file mode 100644 index 0000000..d3d20e3 --- /dev/null +++ b/llm-jp-4-8b-thinking-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc762ca4dcb2098c79612b125d3cd42b75630e782237bd68f74095d5ebc831c +size 4365882176 diff --git a/llm-jp-4-8b-thinking-Q4_0.gguf b/llm-jp-4-8b-thinking-Q4_0.gguf new file mode 100644 index 0000000..6107bce --- /dev/null +++ b/llm-jp-4-8b-thinking-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83fec51871cae5afb731659419f7145024876ee63afbc82d492fa1c553a6334b +size 5045359424 diff --git a/llm-jp-4-8b-thinking-Q4_K_M.gguf b/llm-jp-4-8b-thinking-Q4_K_M.gguf new file mode 100644 index 0000000..b4b9009 --- /dev/null +++ 
b/llm-jp-4-8b-thinking-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4db3d11ba95fc821aca556fa801c1c2cb9c32b96deb2c7f7c04ff612cf784c +size 5304881984 diff --git a/llm-jp-4-8b-thinking-Q4_K_S.gguf b/llm-jp-4-8b-thinking-Q4_K_S.gguf new file mode 100644 index 0000000..1874000 --- /dev/null +++ b/llm-jp-4-8b-thinking-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eaf2321cfab47bc3a1becfc96308f4829e79f96f12da82668946a27ad8d0df0 +size 5076816704 diff --git a/llm-jp-4-8b-thinking-Q5_0.gguf b/llm-jp-4-8b-thinking-Q5_0.gguf new file mode 100644 index 0000000..0770222 --- /dev/null +++ b/llm-jp-4-8b-thinking-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51d3ec435ccf784ab0fb916d2d22025791a50ad6ee987aa56c693d57159b0f9 +size 6018437952 diff --git a/llm-jp-4-8b-thinking-Q5_K_M.gguf b/llm-jp-4-8b-thinking-Q5_K_M.gguf new file mode 100644 index 0000000..53bb923 --- /dev/null +++ b/llm-jp-4-8b-thinking-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0028f354eb518354da2fc05bdad093e8375129c05051977618f86766b4e41a8a +size 6152131392 diff --git a/llm-jp-4-8b-thinking-Q5_K_S.gguf b/llm-jp-4-8b-thinking-Q5_K_S.gguf new file mode 100644 index 0000000..7fe42df --- /dev/null +++ b/llm-jp-4-8b-thinking-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee36e314fb3b1f7d7a4b4db2cc185cfcfc9c01886f7917d08951fbbf19909fd +size 6018437952 diff --git a/llm-jp-4-8b-thinking-Q6_K.gguf b/llm-jp-4-8b-thinking-Q6_K.gguf new file mode 100644 index 0000000..241544a --- /dev/null +++ b/llm-jp-4-8b-thinking-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b57817aad725665a85064b1056f3e88770a614cfc9bdf51655d71d3b66445c +size 7052333888 diff --git a/llm-jp-4-8b-thinking-Q8_0.gguf b/llm-jp-4-8b-thinking-Q8_0.gguf new file mode 100644 index 0000000..3b531d0 --- /dev/null +++ 
b/llm-jp-4-8b-thinking-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ae2df9143e6f3611353de2f09dc6ec30c75d0fbc56ae772791032ef8fd0914 +size 9132708672