From 2049a550392741898cf673e55f51190664c2cf82 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 21 Jun 2026 08:16:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: llamafile-club/Meltemi-llamafile Source: Original Platform --- .gitattributes | 41 ++++++++++ Meltemi-7B-Instruct-v1.5-F16.gguf | 3 + Meltemi-7B-Instruct-v1.5-F16.llamafile | 3 + Meltemi-7B-Instruct-v1.5-Q8_0.gguf | 3 + Meltemi-7B-Instruct-v1.5-Q8_0.llamafile | 3 + README.md | 104 ++++++++++++++++++++++++ configuration.json | 1 + 7 files changed, 158 insertions(+) create mode 100644 .gitattributes create mode 100644 Meltemi-7B-Instruct-v1.5-F16.gguf create mode 100644 Meltemi-7B-Instruct-v1.5-F16.llamafile create mode 100644 Meltemi-7B-Instruct-v1.5-Q8_0.gguf create mode 100644 Meltemi-7B-Instruct-v1.5-Q8_0.llamafile create mode 100644 README.md create mode 100644 configuration.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1bf0bfd --- /dev/null +++ b/.gitattributes @@ -0,0 +1,41 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet 
filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +*.gguf filter=lfs diff=lfs merge=lfs -text +*.llamafile filter=lfs diff=lfs merge=lfs -text +Meltemi-7B-Instruct-v1.5-F16.gguf filter=lfs diff=lfs merge=lfs -text +Meltemi-7B-Instruct-v1.5-F16.llamafile filter=lfs diff=lfs merge=lfs -text +Meltemi-7B-Instruct-v1.5-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Meltemi-7B-Instruct-v1.5-Q8_0.llamafile filter=lfs diff=lfs merge=lfs -text diff --git a/Meltemi-7B-Instruct-v1.5-F16.gguf b/Meltemi-7B-Instruct-v1.5-F16.gguf new file mode 100644 index 0000000..e26b689 --- /dev/null +++ b/Meltemi-7B-Instruct-v1.5-F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79b3de00de81bf4968ca8dc22f01aaf0f5901272390f738a02632e34256d48eb +size 14967052928 diff --git a/Meltemi-7B-Instruct-v1.5-F16.llamafile b/Meltemi-7B-Instruct-v1.5-F16.llamafile new file mode 100644 index 0000000..a187a4a --- /dev/null +++ b/Meltemi-7B-Instruct-v1.5-F16.llamafile @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fa85ca5b6557ec2b4166f8a71b4454a6841ddfe5e0ec55a6997d5fb72236f1 +size 15208495275 diff --git a/Meltemi-7B-Instruct-v1.5-Q8_0.gguf b/Meltemi-7B-Instruct-v1.5-Q8_0.gguf new file mode 100644 index 
0000000..513725b --- /dev/null +++ b/Meltemi-7B-Instruct-v1.5-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6b3bad85d101199b102155e6dad839929b3911d44812499b74c361d1ad03c0 +size 7952509568 diff --git a/Meltemi-7B-Instruct-v1.5-Q8_0.llamafile b/Meltemi-7B-Instruct-v1.5-Q8_0.llamafile new file mode 100644 index 0000000..d1cf8b6 --- /dev/null +++ b/Meltemi-7B-Instruct-v1.5-Q8_0.llamafile @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c6adfafcaf4ce00c7e2fa4b376c01dfc671a1adb05bfc99a81fdce9b426e50 +size 8193915053 diff --git a/README.md b/README.md new file mode 100644 index 0000000..fe9d7f8 --- /dev/null +++ b/README.md @@ -0,0 +1,104 @@ +--- +language: +- el +- en +license: apache-2.0 +pipeline_tag: text-generation +tags: +- finetuned +inference: true +base_model: +- ilsp/Meltemi-7B-Instruct-v1.5 +--- + +# Meltemi llamafile & gguf + +This repo contains `llamafile` and `gguf` file format models for [Meltemi 7B Instruct v1.5](https://huggingface.co/ilsp/Meltemi-7B-Instruct-v1.5), the first Greek Large Language Model (LLM), +trained by the Institute for Language and Speech Processing at Athena Research & Innovation Center. + +llamafile is a file format introduced by Mozilla Ocho on Nov 20th 2023, +and it collapses the complexity of an LLM into a single executable file. +This gives you the easiest, fastest way to use Meltemi on Linux, macOS, Windows, FreeBSD, OpenBSD, and NetBSD systems you control on both AMD64 and ARM64. + +It's as simple as this: + +```shell +wget https://huggingface.co/Florents-Tselai/Meltemi-llamafile/resolve/main/Meltemi-7B-Instruct-v1.5-Q8_0.llamafile +chmod +x Meltemi-7B-Instruct-v1.5-Q8_0.llamafile +``` + +```shell +./Meltemi-7B-Instruct-v1.5-Q8_0.llamafile +``` + +This will open a tab with a chatbot and completion interface in your browser. +For additional help on how it may be used, pass the `--help` flag. 
+ +## API + +The server also has an OpenAI API-compatible chat completions endpoint. + +```shell +curl http://localhost:8080/v1/chat/completions \ +-H "Content-Type: application/json" \ +-H "Authorization: Bearer no-key" \ +-d '{ + "model": "LLaMA_CPP", + "messages": [ + { + "role": "system", + "content": "Είσαι ένας φωτεινός παντογνώστης" + }, + { + "role": "user", + "content": "Γράψε μου μια ιστορία για έναν βάτραχο που έγινε αρνάκι" + } + ] +}' +``` + +## CLI + +An advanced CLI mode is provided that's useful for shell scripting. +You can use it by passing the `--cli` flag. For additional help on how it may be used, pass the `--help` flag. + +```shell +./Meltemi-7B-Instruct-v1.5-Q8_0.llamafile -p 'Ποιό είναι το νόημα της ζωής;' +``` + +To see all available options: + +```shell +./Meltemi-7B-Instruct-v1.5-Q8_0.llamafile --help +``` + +## gguf + +`gguf` files are also available if you're working with [llama.cpp](https://github.com/ggerganov/llama.cpp). + +llama.cpp offers quite a lot of options; refer to its documentation for the full list. + +### Basic Usage + +```shell +llama-cli -m ./Meltemi-7B-Instruct-v1.5-F16.gguf -p "Ποιό είναι το νόημα της ζωής;" -n 128 +``` + +### Conversation Mode + +```shell +llama-cli -m ./Meltemi-7B-Instruct-v1.5-F16.gguf --conv +``` + +### Web Server + +```shell +llama-server -m ./Meltemi-7B-Instruct-v1.5-F16.gguf --port 8080 +``` + +# Model Information + +- Vocabulary extension of the Mistral 7B tokenizer with Greek tokens for lower costs and faster inference (**1.52** vs. 6.80 tokens/word for Greek) +- 8192 context length + +For more details, please refer to the original model card [Meltemi 7B Instruct v1.5](https://huggingface.co/ilsp/Meltemi-7B-Instruct-v1.5) diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file