From 7913f83f512d8a2224eff26cc1803b81611ec00d Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 21 Jun 2026 11:24:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: davidkim205/komt-llama2-7b-v1-ggml Source: Original Platform --- .gitattributes | 50 ++++++++++++++++++++++++++++++++++++++++++ README.md | 49 +++++++++++++++++++++++++++++++++++++++++ ggml-model-q2_k.gguf | 3 +++ ggml-model-q3_k.gguf | 3 +++ ggml-model-q3_k_l.gguf | 3 +++ ggml-model-q3_k_m.gguf | 3 +++ ggml-model-q4_0.gguf | 3 +++ ggml-model-q4_1.gguf | 3 +++ ggml-model-q4_k.gguf | 3 +++ ggml-model-q4_k_m.gguf | 3 +++ ggml-model-q4_k_s.gguf | 3 +++ ggml-model-q5_0.gguf | 3 +++ ggml-model-q5_1.gguf | 3 +++ ggml-model-q5_k.gguf | 3 +++ ggml-model-q5_k_m.gguf | 3 +++ ggml-model-q5_k_s.gguf | 3 +++ ggml-model-q8_0.gguf | 3 +++ 17 files changed, 144 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 ggml-model-q2_k.gguf create mode 100644 ggml-model-q3_k.gguf create mode 100644 ggml-model-q3_k_l.gguf create mode 100644 ggml-model-q3_k_m.gguf create mode 100644 ggml-model-q4_0.gguf create mode 100644 ggml-model-q4_1.gguf create mode 100644 ggml-model-q4_k.gguf create mode 100644 ggml-model-q4_k_m.gguf create mode 100644 ggml-model-q4_k_s.gguf create mode 100644 ggml-model-q5_0.gguf create mode 100644 ggml-model-q5_1.gguf create mode 100644 ggml-model-q5_k.gguf create mode 100644 ggml-model-q5_k_m.gguf create mode 100644 ggml-model-q5_k_s.gguf create mode 100644 ggml-model-q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..0975123 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,50 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs 
diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +ggml-model-q2_k.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q3_k_l.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q3_k.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q4_0.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q4_1.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q4_k.gguf filter=lfs diff=lfs merge=lfs -text 
+ggml-model-q5_0.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q5_1.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q5_k.gguf filter=lfs diff=lfs merge=lfs -text +ggml-model-q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..09b4bc2 --- /dev/null +++ b/README.md @@ -0,0 +1,49 @@ +--- +language: +- en +- ko +pipeline_tag: text-generation +inference: false +tags: +- facebook +- meta +- pytorch +- llama +- llama-2 +- llama-2-chat +license: apache-2.0 +--- +# komt : korean multi task instruction tuning model +![multi task instruction tuning.jpg](https://github.com/davidkim205/komt/assets/16680469/c7f6ade7-247e-4b62-a94f-47e19abea68e) + +Recently, due to the success of ChatGPT, numerous large language models have emerged in an attempt to catch up with ChatGPT's capabilities. +However, when it comes to Korean language performance, it has been observed that many models still struggle to provide accurate answers or generate Korean text effectively. +This study addresses these challenges by introducing a multi-task instruction technique that leverages supervised datasets from various tasks to create training data for Large Language Models (LLMs). + +## Model Details + +* **Model Developers** : davidkim(changyeon kim) +* **Repository** : https://github.com/davidkim205/komt +* **quant methods** : q4_0, q4_1, q5_0, q5_1, q2_k, q3_k, q3_k_m, q3_k_l, q4_k, q4_k_s, q4_k_m, q5_k, q5_k_s, q5_k_m, q8_0 + + +## Training +Refer to https://github.com/davidkim205/komt + +## Evaluation +For objective model evaluation, we initially used EleutherAI's lm-evaluation-harness but obtained unsatisfactory results. 
Consequently, we conducted evaluations using ChatGPT, a widely used model, as described in [Self-Alignment with Instruction Backtranslation](https://arxiv.org/pdf/2308.06502.pdf) and [Three Ways of Using Large Language Models to Evaluate Chat](https://arxiv.org/pdf/2308.06259.pdf). + +| model | score | average(0~5) | percentage | +| --------------------------------------- | ------- | ------------ | ---------- | +| gpt-3.5-turbo(close) | 147 | 3.97 | 79.45% | +| naver Cue(close) | 140 | 3.78 | 75.67% | +| clova X(close) | 136 | 3.67 | 73.51% | +| WizardLM-13B-V1.2(open) | 96 | 2.59 | 51.89% | +| Llama-2-7b-chat-hf(open) | 67 | 1.81 | 36.21% | +| Llama-2-13b-chat-hf(open) | 73 | 1.91 | 38.37% | +| nlpai-lab/kullm-polyglot-12.8b-v2(open) | 70 | 1.89 | 37.83% | +| kfkas/Llama-2-ko-7b-Chat(open) | 96 | 2.59 | 51.89% | +| beomi/KoAlpaca-Polyglot-12.8B(open) | 100 | 2.70 | 54.05% | +| **komt-llama2-7b-v1 (open)(ours)** | **117** | **3.16** | **63.24%** | +| **komt-llama2-13b-v1 (open)(ours)** | **129** | **3.48** | **69.72%** | + diff --git a/ggml-model-q2_k.gguf b/ggml-model-q2_k.gguf new file mode 100644 index 0000000..897d183 --- /dev/null +++ b/ggml-model-q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10a2b5e1f46377d63e34f884773050b411152bedf6913dd8a5cb8b9d6854355 +size 2825945408 diff --git a/ggml-model-q3_k.gguf b/ggml-model-q3_k.gguf new file mode 100644 index 0000000..5eeb349 --- /dev/null +++ b/ggml-model-q3_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b62e1ac9b2b708327617eb834e4531945dfb06f52cebac0a10c16275f430e56 +size 3298009824 diff --git a/ggml-model-q3_k_l.gguf b/ggml-model-q3_k_l.gguf new file mode 100644 index 0000000..4c3f0a7 --- /dev/null +++ b/ggml-model-q3_k_l.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac1368fa9f94ed9dba4a4593119a532bf07559ad15249530d4f0ac831ea0702 +size 3597116128 diff --git a/ggml-model-q3_k_m.gguf b/ggml-model-q3_k_m.gguf new 
file mode 100644 index 0000000..5eeb349 --- /dev/null +++ b/ggml-model-q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b62e1ac9b2b708327617eb834e4531945dfb06f52cebac0a10c16275f430e56 +size 3298009824 diff --git a/ggml-model-q4_0.gguf b/ggml-model-q4_0.gguf new file mode 100644 index 0000000..a66bcc7 --- /dev/null +++ b/ggml-model-q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea0a0a4838639bcd8807c5bfc730cafe1f605bf954097f640a7d222ab9124cc +size 3825812736 diff --git a/ggml-model-q4_1.gguf b/ggml-model-q4_1.gguf new file mode 100644 index 0000000..e039c34 --- /dev/null +++ b/ggml-model-q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c65a6fd48a17b3724030684b943a76da8bc09d820e9093a397af877a248a183 +size 4238755328 diff --git a/ggml-model-q4_k.gguf b/ggml-model-q4_k.gguf new file mode 100644 index 0000000..51c9ad8 --- /dev/null +++ b/ggml-model-q4_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c8f909269231e8340375f89259f44900abe9f734db4f8ed2df7b7d8eb9dc4a +size 4081009920 diff --git a/ggml-model-q4_k_m.gguf b/ggml-model-q4_k_m.gguf new file mode 100644 index 0000000..51c9ad8 --- /dev/null +++ b/ggml-model-q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c8f909269231e8340375f89259f44900abe9f734db4f8ed2df7b7d8eb9dc4a +size 4081009920 diff --git a/ggml-model-q4_k_s.gguf b/ggml-model-q4_k_s.gguf new file mode 100644 index 0000000..6db95ef --- /dev/null +++ b/ggml-model-q4_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd219e082dc39b27b8cd737d851d40afbbb80ca5e8ca08cce8db3892fa3343a +size 3856745728 diff --git a/ggml-model-q5_0.gguf b/ggml-model-q5_0.gguf new file mode 100644 index 0000000..507eeda --- /dev/null +++ b/ggml-model-q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9bfe1803862eaf2b89723b5ae1d6b0bccd1add7bbadbcf103c31c895d6076696 +size 4651697920 diff --git a/ggml-model-q5_1.gguf b/ggml-model-q5_1.gguf new file mode 100644 index 0000000..b3d8106 --- /dev/null +++ b/ggml-model-q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f69311aa2757ec6ff849d0f639f3724054c0fa3e3bad66bff36ec65f59a30c8 +size 5064640512 diff --git a/ggml-model-q5_k.gguf b/ggml-model-q5_k.gguf new file mode 100644 index 0000000..1138647 --- /dev/null +++ b/ggml-model-q5_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea8777f3232227e478cfc3258bc17f1976dba0414810a99be488bc11d59b5f8 +size 4783163136 diff --git a/ggml-model-q5_k_m.gguf b/ggml-model-q5_k_m.gguf new file mode 100644 index 0000000..1138647 --- /dev/null +++ b/ggml-model-q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea8777f3232227e478cfc3258bc17f1976dba0414810a99be488bc11d59b5f8 +size 4783163136 diff --git a/ggml-model-q5_k_s.gguf b/ggml-model-q5_k_s.gguf new file mode 100644 index 0000000..3339a8d --- /dev/null +++ b/ggml-model-q5_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967f62dfd3a934050bf979d23436dfc42490e13695cc5f1f8f6f6eee10b79488 +size 4651697920 diff --git a/ggml-model-q8_0.gguf b/ggml-model-q8_0.gguf new file mode 100644 index 0000000..6fb19b7 --- /dev/null +++ b/ggml-model-q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7dada8a0a06c87da5996688e35cd48743ad88840a929897b8cbc31b9c9dca21 +size 7161098464