From 800e83ed9046bc6207ae8fa37a4ddf531b22cb0e Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 21 Jun 2026 11:41:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: QuantFactory/AI-Sweden-Llama-3-8B-Instruct-GGUF Source: Original Platform --- .gitattributes | 49 +++++++++++++++++++++ Llama-3-8B-Instruct.Q2_K.gguf | 3 ++ Llama-3-8B-Instruct.Q3_K_L.gguf | 3 ++ Llama-3-8B-Instruct.Q3_K_M.gguf | 3 ++ Llama-3-8B-Instruct.Q3_K_S.gguf | 3 ++ Llama-3-8B-Instruct.Q4_0.gguf | 3 ++ Llama-3-8B-Instruct.Q4_1.gguf | 3 ++ Llama-3-8B-Instruct.Q4_K_M.gguf | 3 ++ Llama-3-8B-Instruct.Q4_K_S.gguf | 3 ++ Llama-3-8B-Instruct.Q5_0.gguf | 3 ++ Llama-3-8B-Instruct.Q5_1.gguf | 3 ++ Llama-3-8B-Instruct.Q5_K_M.gguf | 3 ++ Llama-3-8B-Instruct.Q5_K_S.gguf | 3 ++ Llama-3-8B-Instruct.Q6_K.gguf | 3 ++ Llama-3-8B-Instruct.Q8_0.gguf | 3 ++ README.md | 77 +++++++++++++++++++++++++++++++++ configuration.json | 1 + 17 files changed, 169 insertions(+) create mode 100644 .gitattributes create mode 100644 Llama-3-8B-Instruct.Q2_K.gguf create mode 100644 Llama-3-8B-Instruct.Q3_K_L.gguf create mode 100644 Llama-3-8B-Instruct.Q3_K_M.gguf create mode 100644 Llama-3-8B-Instruct.Q3_K_S.gguf create mode 100644 Llama-3-8B-Instruct.Q4_0.gguf create mode 100644 Llama-3-8B-Instruct.Q4_1.gguf create mode 100644 Llama-3-8B-Instruct.Q4_K_M.gguf create mode 100644 Llama-3-8B-Instruct.Q4_K_S.gguf create mode 100644 Llama-3-8B-Instruct.Q5_0.gguf create mode 100644 Llama-3-8B-Instruct.Q5_1.gguf create mode 100644 Llama-3-8B-Instruct.Q5_K_M.gguf create mode 100644 Llama-3-8B-Instruct.Q5_K_S.gguf create mode 100644 Llama-3-8B-Instruct.Q6_K.gguf create mode 100644 Llama-3-8B-Instruct.Q8_0.gguf create mode 100644 README.md create mode 100644 configuration.json diff --git 
a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4bca19e --- /dev/null +++ b/.gitattributes @@ -0,0 +1,49 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q3_K_M.gguf 
filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Llama-3-8B-Instruct.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Llama-3-8B-Instruct.Q2_K.gguf b/Llama-3-8B-Instruct.Q2_K.gguf new file mode 100644 index 0000000..986831a --- /dev/null +++ b/Llama-3-8B-Instruct.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:027c7bb20541b873dcf924b78ed68b1408ac14754c3d1d8c82cb03521e7696df +size 3179131136 diff --git a/Llama-3-8B-Instruct.Q3_K_L.gguf b/Llama-3-8B-Instruct.Q3_K_L.gguf new file mode 100644 index 0000000..5ffaa17 --- /dev/null +++ b/Llama-3-8B-Instruct.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27397186a69b50cf71281a5b9630eea6d7275b313acb5192d904508b4a3eef1f +size 4321956096 diff --git a/Llama-3-8B-Instruct.Q3_K_M.gguf b/Llama-3-8B-Instruct.Q3_K_M.gguf new file mode 100644 index 0000000..213eeae --- /dev/null +++ b/Llama-3-8B-Instruct.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f3be4ee82a3a784ec3a5ae442e4c71fbf361177ea9950a386371f99fa0d5c1 +size 4018917632 diff --git a/Llama-3-8B-Instruct.Q3_K_S.gguf b/Llama-3-8B-Instruct.Q3_K_S.gguf new file mode 100644 index 0000000..3b30a68 --- /dev/null +++ b/Llama-3-8B-Instruct.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe2dd4f35478be6eb0efe88debd88e8bb381f579cebd7466150b435552c09b8 +size 3664498944 diff --git a/Llama-3-8B-Instruct.Q4_0.gguf 
b/Llama-3-8B-Instruct.Q4_0.gguf new file mode 100644 index 0000000..c948f9d --- /dev/null +++ b/Llama-3-8B-Instruct.Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54531973f4bb8c1d4e551650c61c223f9d8780b782b2abf90e690c7e096c7867 +size 4661211392 diff --git a/Llama-3-8B-Instruct.Q4_1.gguf b/Llama-3-8B-Instruct.Q4_1.gguf new file mode 100644 index 0000000..e71a76c --- /dev/null +++ b/Llama-3-8B-Instruct.Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c396b42bd6e9b2368df15992bd21bac911b847a9015a7ef6b113b49a1d46149 +size 5130252544 diff --git a/Llama-3-8B-Instruct.Q4_K_M.gguf b/Llama-3-8B-Instruct.Q4_K_M.gguf new file mode 100644 index 0000000..d59df26 --- /dev/null +++ b/Llama-3-8B-Instruct.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79fa6a2e5f64b9d249d3f17fd49320c190b791d82dbb09c4c87ba0809549a554 +size 4920733952 diff --git a/Llama-3-8B-Instruct.Q4_K_S.gguf b/Llama-3-8B-Instruct.Q4_K_S.gguf new file mode 100644 index 0000000..8a57e8a --- /dev/null +++ b/Llama-3-8B-Instruct.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57b076a74d2b3cccde2f2e4c3017ab08357330789ada55213b51f2972dab690 +size 4692668672 diff --git a/Llama-3-8B-Instruct.Q5_0.gguf b/Llama-3-8B-Instruct.Q5_0.gguf new file mode 100644 index 0000000..0c5ad54 --- /dev/null +++ b/Llama-3-8B-Instruct.Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ee37c010296b958a1249f5b9448b271e9d0a3a7c35b6956ebb297187649bbbd +size 5599293696 diff --git a/Llama-3-8B-Instruct.Q5_1.gguf b/Llama-3-8B-Instruct.Q5_1.gguf new file mode 100644 index 0000000..d50b55d --- /dev/null +++ b/Llama-3-8B-Instruct.Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7925ebeea2449ebe7abc7f827c8f5c35c58e33bbc4aea479f40e1d017c430f +size 6068334848 diff --git a/Llama-3-8B-Instruct.Q5_K_M.gguf b/Llama-3-8B-Instruct.Q5_K_M.gguf new file mode 
100644 index 0000000..3bef8ce --- /dev/null +++ b/Llama-3-8B-Instruct.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4802db9eb6a446758f8b17f0565fc0c8989df03a6d09e20ffa7d060e00391d36 +size 5732987136 diff --git a/Llama-3-8B-Instruct.Q5_K_S.gguf b/Llama-3-8B-Instruct.Q5_K_S.gguf new file mode 100644 index 0000000..b37934c --- /dev/null +++ b/Llama-3-8B-Instruct.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b08d3c40541ccc059cf2c9c8a0c223db443b1f569282cbdd256e2a648bac63 +size 5599293696 diff --git a/Llama-3-8B-Instruct.Q6_K.gguf b/Llama-3-8B-Instruct.Q6_K.gguf new file mode 100644 index 0000000..d144abf --- /dev/null +++ b/Llama-3-8B-Instruct.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a9c5e97612c7640db6f6e8c8d0741eee148087591cf17b85f8361ec3e37851 +size 6596006144 diff --git a/Llama-3-8B-Instruct.Q8_0.gguf b/Llama-3-8B-Instruct.Q8_0.gguf new file mode 100644 index 0000000..83178e9 --- /dev/null +++ b/Llama-3-8B-Instruct.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944ba761cb4b40111dd808b979f11ddf5e5f25358e38d1a086a666f529adb273 +size 8540770560 diff --git a/README.md b/README.md new file mode 100644 index 0000000..f35e47a --- /dev/null +++ b/README.md @@ -0,0 +1,77 @@ +--- +license: apache-2.0 +datasets: teknium/OpenHermes-2.5 +base_model: AI-Sweden-Models/Llama-3-8B-instruct +pipeline_tag: text-generation +--- + +# QuantFactory/AI-Sweden-Llama-3-8B-Instruct-GGUF +This is a quantized version of [AI-Sweden-Models/Llama-3-8B-instruct](https://huggingface.co/AI-Sweden-Models/Llama-3-8B-instruct) created using llama.cpp + +# Model Description + +# Checkpoint 1 + +## Training setup +The training was performed on the [LUMI supercomputer](https://lumi-supercomputer.eu/) within the [DeployAI EU project](https://www.ai.se/en/project/deployai). 
+Based on the base model [AI-Sweden-Models/Llama-3-8B](https://huggingface.co/AI-Sweden-Models/Llama-3-8B). + +## Dataset +A data recipe by: [42 Labs](https://huggingface.co/four-two-labs) +![](https://huggingface.co/AI-Sweden-Models/Llama-3-8B-instruct/resolve/main/42logo.png?download=true) + +## How to use + +```python +import transformers +import torch + +model_id = "AI-Sweden-Models/Llama-3-8B-instruct" + +pipeline = transformers.pipeline( + "text-generation", + model=model_id, + model_kwargs={"torch_dtype": torch.bfloat16}, + device_map="auto", +) + +messages = [ + {"role": "system", "content": "Du är en hjälpsam assistant som svarar klokt och vänligt."}, + {"role": "user", "content": "Hur gör man pannkakor? Och vad behöver man handla? Undrar också vad 5+6 är.."}, +] + +terminators = [ + pipeline.tokenizer.eos_token_id, + pipeline.tokenizer.convert_tokens_to_ids("<|eot_id|>") +] + +outputs = pipeline( + messages, + max_new_tokens=256, + eos_token_id=terminators, + do_sample=True, + temperature=0.6, + top_p=0.9, +) +print(outputs[0]["generated_text"][-1]) +``` +```python +>>> "För att göra pannkakor behöver du följande ingredienser: +- 1 kopp vetemjöl +- 1 tesked bakpulver +- 1/4 tesked salt +- 1 kopp mjölk +- 1 stort ägg +- 2 matskedar smält smör eller olja + +För att börja, blanda vetemjölet, bakpulvret och saltet i en bunke. I en annan skål, vispa ihop mjölken, ägget och smöret eller oljan. +Tillsätt de våta ingredienserna till de torra ingredienserna och blanda tills det är väl blandat. +Låt smeten vila i cirka 10 minuter. + +För att göra pannkakorna, värm en non-stick-panna eller stekpanna över medelvärme. +När den är varm, häll smeten på pannan och grädda tills kanterna börjar torka ut och toppen är fast. +Vänd pannkakan med en stekspade och grädda den andra sidan tills den är gyllenbrun. +Upprepa med resten av smeten. + +När det gäller 5+6 är svaret 11." 
+``` \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file