From 5857f641afe4812a5e986b5232993370a91789f2 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 13 Apr 2026 19:48:04 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: afrideva/phi-2-chat-GGUF Source: Original Platform --- .gitattributes | 42 ++++++++++++++++++++ README.md | 87 ++++++++++++++++++++++++++++++++++++++++++ phi-2-chat.fp16.gguf | 3 ++ phi-2-chat.q2_k.gguf | 3 ++ phi-2-chat.q3_k_m.gguf | 3 ++ phi-2-chat.q4_k_m.gguf | 3 ++ phi-2-chat.q5_k_m.gguf | 3 ++ phi-2-chat.q6_k.gguf | 3 ++ phi-2-chat.q8_0.gguf | 3 ++ 9 files changed, 150 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 phi-2-chat.fp16.gguf create mode 100644 phi-2-chat.q2_k.gguf create mode 100644 phi-2-chat.q3_k_m.gguf create mode 100644 phi-2-chat.q4_k_m.gguf create mode 100644 phi-2-chat.q5_k_m.gguf create mode 100644 phi-2-chat.q6_k.gguf create mode 100644 phi-2-chat.q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2381708 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,42 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text 
+*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +phi-2-chat.fp16.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q2_k.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q6_k.gguf filter=lfs diff=lfs merge=lfs -text +phi-2-chat.q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..2a1819a --- /dev/null +++ b/README.md @@ -0,0 +1,87 @@ +--- +base_model: malhajar/phi-2-chat +datasets: +- yahma/alpaca-cleaned +inference: false +language: +- en +model_creator: malhajar +model_name: phi-2-chat +pipeline_tag: text-generation +quantized_by: afrideva +tags: +- gguf +- ggml +- quantized +- q2_k +- q3_k_m +- q4_k_m +- q5_k_m +- q6_k +- q8_0 +--- +# malhajar/phi-2-chat-GGUF + +Quantized GGUF model files for [phi-2-chat](https://huggingface.co/malhajar/phi-2-chat) from [malhajar](https://huggingface.co/malhajar) + + +| Name | Quant method | Size | +| ---- | ---- | ---- | +| 
+| [phi-2-chat.fp16.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.fp16.gguf) | fp16 | 5.56 GB | +| [phi-2-chat.q2_k.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q2_k.gguf) | q2_k | 1.17 GB | +| [phi-2-chat.q3_k_m.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q3_k_m.gguf) | q3_k_m | 1.48 GB | +| [phi-2-chat.q4_k_m.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q4_k_m.gguf) | q4_k_m | 1.79 GB | +| [phi-2-chat.q5_k_m.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q5_k_m.gguf) | q5_k_m | 2.07 GB | +| [phi-2-chat.q6_k.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q6_k.gguf) | q6_k | 2.29 GB | +| [phi-2-chat.q8_0.gguf](https://huggingface.co/afrideva/phi-2-chat-GGUF/resolve/main/phi-2-chat.q8_0.gguf) | q8_0 | 2.96 GB | + + + +## Original Model Card: +# Model Card for Model ID + + +malhajar/phi-2-chat is a fine-tuned version of [`phi-2`](https://huggingface.co/microsoft/phi-2), trained with supervised fine-tuning (SFT). +This model can answer questions in a chat format, as it was fine-tuned specifically on the [`alpaca-cleaned`](https://huggingface.co/datasets/yahma/alpaca-cleaned) instruction dataset. + +### Model Description + +- **Developed by:** [`Mohamad Alhajar`](https://www.linkedin.com/in/muhammet-alhajar/) +- **Language(s) (NLP):** Turkish +- **Finetuned from model:** [`microsoft/phi-2`](https://huggingface.co/microsoft/phi-2) + +### Prompt Template +``` +### Instruction: + +<prompt> (without the <>) + +### Response: +``` + +## How to Get Started with the Model + +Use the code sample below, taken from the original model card, to interact with the model. 
+```python +import torch +from transformers import AutoModelForCausalLM, AutoTokenizer + +model_id = "malhajar/phi-2-chat" +model = AutoModelForCausalLM.from_pretrained(model_id, + device_map="auto", + torch_dtype=torch.float16, + revision="main", trust_remote_code=True) + +tokenizer = AutoTokenizer.from_pretrained(model_id) + +question = "Türkiyenin en büyük şehir nedir?" +# For generating a response +prompt = f''' +### Instruction: {question} ### Response: +''' +input_ids = tokenizer(prompt, return_tensors="pt").input_ids.to(model.device) +output = model.generate(inputs=input_ids,max_new_tokens=512,pad_token_id=tokenizer.eos_token_id,top_k=50, do_sample=True,repetition_penalty=1.3, + top_p=0.95) +response = tokenizer.decode(output[0]) +print(response) +``` \ No newline at end of file diff --git a/phi-2-chat.fp16.gguf b/phi-2-chat.fp16.gguf new file mode 100644 index 0000000..6b254f0 --- /dev/null +++ b/phi-2-chat.fp16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d89fdb6c770afb5367389d2648a206d66d80407e6abcc45dd3c7dbbd1aaa75c +size 5563088672 diff --git a/phi-2-chat.q2_k.gguf b/phi-2-chat.q2_k.gguf new file mode 100644 index 0000000..fc9bb81 --- /dev/null +++ b/phi-2-chat.q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27aa5606fa77f0ee881f89b700c15334dd48def3ec2f1b380f4780f0e227ce8a +size 1173610336 diff --git a/phi-2-chat.q3_k_m.gguf b/phi-2-chat.q3_k_m.gguf new file mode 100644 index 0000000..2fa2f3b --- /dev/null +++ b/phi-2-chat.q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67bea36a467bfb2f6c120a75af709a7d798cf61a2ed86d7d600ce10c5727d2d9 +size 1480195936 diff --git a/phi-2-chat.q4_k_m.gguf b/phi-2-chat.q4_k_m.gguf new file mode 100644 index 0000000..49add3c --- /dev/null +++ b/phi-2-chat.q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfc5f093d0ac3e60bbb551e64a20f20cd93ab17c1671c726befe228080c656c +size 1789239136 diff --git 
a/phi-2-chat.q5_k_m.gguf b/phi-2-chat.q5_k_m.gguf new file mode 100644 index 0000000..7866e30 --- /dev/null +++ b/phi-2-chat.q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66abd86c56f3b438bc40ab39325b2c3c4c89df13675b4d3e0f22f92c2a53d842 +size 2072682336 diff --git a/phi-2-chat.q6_k.gguf b/phi-2-chat.q6_k.gguf new file mode 100644 index 0000000..9f0b7bc --- /dev/null +++ b/phi-2-chat.q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81b19e930952df4a1da9fd1b9e43c5f820f8c000279e4ad2bc78c6ca84f938a5 +size 2285059936 diff --git a/phi-2-chat.q8_0.gguf b/phi-2-chat.q8_0.gguf new file mode 100644 index 0000000..513a5cc --- /dev/null +++ b/phi-2-chat.q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2726b43e148806b95c9cef08e67bdf898719f750f510ef1e4f411f8d8d27965c +size 2958032736