From 87dd5b90e5d88f0f7e384ffe63485b98cef56bf6 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 17 Jun 2026 22:05:20 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: IlyaGusev/saiga2_7b_gguf Source: Original Platform --- .gitattributes | 41 +++++++++++++++++++++++++++++++++++++++++ README.md | 36 ++++++++++++++++++++++++++++++++++++ model-q2_K.gguf | 3 +++ model-q3_K.gguf | 3 +++ model-q4_K.gguf | 3 +++ model-q5_K.gguf | 3 +++ model-q8_0.gguf | 3 +++ 7 files changed, 92 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 model-q2_K.gguf create mode 100644 model-q3_K.gguf create mode 100644 model-q4_K.gguf create mode 100644 model-q5_K.gguf create mode 100644 model-q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b40a078 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,41 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +*.gguf filter=lfs diff=lfs merge=lfs -text +model-q2_K.gguf filter=lfs diff=lfs merge=lfs -text +model-q3_K.gguf filter=lfs diff=lfs merge=lfs -text +model-q4_K.gguf filter=lfs diff=lfs merge=lfs -text +model-q5_K.gguf filter=lfs diff=lfs merge=lfs -text +model-q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..0f084d4 --- /dev/null +++ b/README.md @@ -0,0 +1,36 @@ +--- +datasets: +- IlyaGusev/ru_turbo_alpaca +- IlyaGusev/ru_turbo_saiga +- IlyaGusev/ru_sharegpt_cleaned +- IlyaGusev/oasst1_ru_main_branch +- IlyaGusev/ru_turbo_alpaca_evol_instruct +- lksy/ru_instruct_gpt4 +language: +- ru +inference: false +pipeline_tag: conversational +license: llama2 +--- + +Llama.cpp compatible versions of an original [7B model](https://huggingface.co/IlyaGusev/saiga2_7b_lora). + +Download one of the versions, for example `model-q4_K.gguf`. +``` +wget https://huggingface.co/IlyaGusev/saiga2_7b_gguf/resolve/main/model-q4_K.gguf +``` + +Download [interact_llamacpp.py](https://raw.githubusercontent.com/IlyaGusev/rulm/master/self_instruct/src/interact_llamacpp.py) +``` +wget https://raw.githubusercontent.com/IlyaGusev/rulm/master/self_instruct/src/interact_llamacpp.py +``` + +How to run: +``` +pip install llama-cpp-python fire + +python3 interact_llamacpp.py model-q4_K.gguf +``` + +System requirements: +* 10GB RAM for q8_0 and less for smaller quantizations diff --git a/model-q2_K.gguf b/model-q2_K.gguf new file mode 100644 index 0000000..ab10ce9 --- /dev/null +++ b/model-q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecdb8ac229f6cdc3f21d5a3e95dcd26f31c355b727299e96b44ab7a7dbc34fb4 +size 2825940544 diff --git a/model-q3_K.gguf b/model-q3_K.gguf new file mode 100644 index 0000000..5b726a8 --- /dev/null +++ b/model-q3_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ec17b11219d55186d69deae515ec909ea54ecd5918b803f8deabd7a575396c +size 3298004544 diff --git a/model-q4_K.gguf b/model-q4_K.gguf new file mode 100644 index 0000000..801400d --- /dev/null +++ b/model-q4_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d9ab608346c90e70eae6ab086524550c7ff5d5a34e6eb98b5b0531ef62b991 +size 4081004096 diff --git a/model-q5_K.gguf b/model-q5_K.gguf new file mode 100644 index 0000000..9e6843f --- /dev/null +++ b/model-q5_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149862753771f3a096e05b3732c520d37d8a2b099b795a4434b813fe989d1f58 +size 4783156800 diff --git a/model-q8_0.gguf b/model-q8_0.gguf new file mode 100644 index 0000000..0660285 --- /dev/null +++ b/model-q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c51054fa221c692ba2cee0ebfa63e87c1fed2abdf8608bb820c5c1b58c5c22c +size 7161089600