From 45d9c23d0ba169cbcb19a8b1891be1e6038daf00 Mon Sep 17 00:00:00 2001
From: ModelHub XC <noreply@modelhub.org.cn>
Date: Tue, 9 Jun 2026 16:10:17 +0800
Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?=
 =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?=
 =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Model: Kortix/FastApply-7B-v1.0_GGUF
Source: Original Platform
---
 .gitattributes    |  41 ++++++++++++++++
 README.md         | 120 ++++++++++++++++++++++++++++++++++++++++++++++
 config.json       |   3 ++
 hf.Q4_K_M.gguf    |   3 ++
 hf.Q5_K_M.gguf    |   3 ++
 unsloth.F16.gguf  |   3 ++
 unsloth.Q8_0.gguf |   3 ++
 7 files changed, 176 insertions(+)
 create mode 100644 .gitattributes
 create mode 100644 README.md
 create mode 100644 config.json
 create mode 100644 hf.Q4_K_M.gguf
 create mode 100644 hf.Q5_K_M.gguf
 create mode 100644 unsloth.F16.gguf
 create mode 100644 unsloth.Q8_0.gguf

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..e0bc186
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,41 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+unsloth.F16.gguf filter=lfs diff=lfs merge=lfs -text
+unsloth.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+fastapply-7b-v1.0-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text
+fastapply-7b-v1.0-q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text
+hf.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+hf.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..cd1435a
--- /dev/null
+++ b/README.md
@@ -0,0 +1,120 @@
+---
+base_model: unsloth/qwen2.5-coder-7b-instruct-bnb-4bit
+language:
+- en
+license: apache-2.0
+tags:
+- text-generation-inference
+- transformers
+- unsloth
+- qwen2
+- trl
+- sft
+- fast-apply
+- instant-apply
+---
+
+# FastApply-7B-v1.0
+
+[GitHub: kortix-ai/fast-apply](https://github.com/kortix-ai/fast-apply)   
+[Dataset: Kortix/FastApply-dataset-v1.0](https://huggingface.co/datasets/Kortix/FastApply-dataset-v1.0)    
+[Try it now on 👉 Google Colab](https://colab.research.google.com/drive/1aBqM8Lqso0Xfgtr75G4LFQivXcChU_36?usp=sharing)
+
+## Model Details
+
+### Basic Information
+
+- **Developed by:** Kortix
+- **License:** apache-2.0
+- **Finetuned from model:** [unsloth/Qwen2.5-Coder-7B-Instruct-bnb-4bit](https://huggingface.co/unsloth/Qwen2.5-Coder-7B-Instruct-bnb-4bit)
+
+### Model Description
+
+FastApply-7B-v1.0 is a 7B model designed for instant code application, producing full file edits to power [SoftGen AI](https://softgen.ai/).    
+It is part of the Fast Apply pipeline for data generation and fine-tuning Qwen2.5 Coder models.
+
+When deployed on fast providers like Fireworks, the model achieves a throughput of approximately 150 tokens/second while maintaining high edit accuracy.
+
+## Intended Use
+
+FastApply-7B-v1.0 is intended for use in AI-powered code editors and tools that require fast, accurate code modifications. It is particularly well-suited for:
+
+- Instant code application tasks
+- Full file edits
+- Integration with AI-powered code editors like Aider and PearAI
+- Local tools to reduce the cost of frontier model output
+
+## Inference Template
+
+FastApply-7B-v1.0 is based on the Qwen2.5 Coder architecture and is fine-tuned for code editing tasks. It uses a specific prompt structure for inference:
+
+```
+<|im_start|>system
+You are a coding assistant that helps merge code updates, ensuring every modification is fully integrated.<|im_end|>
+<|im_start|>user
+Merge all changes from the <update> snippet into the <code> below.
+- Preserve the code's structure, order, comments, and indentation exactly.
+- Output only the updated code, enclosed within <updated-code> and </updated-code> tags.
+- Do not include any additional text, explanations, placeholders, ellipses, or code fences.
+
+<code>{original_code}</code>
+
+<update>{update_snippet}</update>
+
+Provide the complete updated code.<|im_end|>
+<|im_start|>assistant
+```
+
+The model's output is structured as:
+
+```
+<updated-code>[Complete updated file]</updated-code>
+```
+
+## Additional Information
+
+For more details on the Fast Apply pipeline, data generation process, and deployment instructions, please refer to the [GitHub repository](https://github.com/kortix-ai/fast-apply).
+
+## How to Use
+
+To use the model, you can load the `Kortix/FastApply-7B-v1.0` checkpoint with the Hugging Face Transformers library (this snippet does not use the `.gguf` files):
+
+
+```python
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+model = AutoModelForCausalLM.from_pretrained("Kortix/FastApply-7B-v1.0")
+tokenizer = AutoTokenizer.from_pretrained("Kortix/FastApply-7B-v1.0")
+
+# Prepare your input following the prompt structure mentioned above (define `original_code` and `update_snippet` as strings first)
+input_text = """<|im_start|>system
+You are a coding assistant that helps merge code updates, ensuring every modification is fully integrated.<|im_end|>
+<|im_start|>user
+Merge all changes from the <update> snippet into the <code> below.
+- Preserve the code's structure, order, comments, and indentation exactly.
+- Output only the updated code, enclosed within <updated-code> and </updated-code> tags.
+- Do not include any additional text, explanations, placeholders, ellipses, or code fences.
+
+<code>{original_code}</code>
+
+<update>{update_snippet}</update>
+
+Provide the complete updated code.<|im_end|>
+<|im_start|>assistant
+"""
+
+input_text = input_text.format(
+    original_code=original_code,
+    update_snippet=update_snippet,
+).strip() 
+
+# Generate the response
+input_ids = tokenizer.encode(input_text, return_tensors="pt")
+output = model.generate(input_ids, max_length=8192,)
+
+response = tokenizer.decode(output[0][len(input_ids[0]):])
+print(response)
+
+# Extract the updated code from the response
+updated_code = response.split("<updated-code>")[1].split("</updated-code>")[0]
+```
\ No newline at end of file
diff --git a/config.json b/config.json
new file mode 100644
index 0000000..5ca493c
--- /dev/null
+++ b/config.json
@@ -0,0 +1,3 @@
+{
+    "model_type": "qwen2"
+}
\ No newline at end of file
diff --git a/hf.Q4_K_M.gguf b/hf.Q4_K_M.gguf
new file mode 100644
index 0000000..af11e14
--- /dev/null
+++ b/hf.Q4_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7077ca675eeea5cbad509fc296edd50fafad6a32a7d1d9cffc263e4b764357ff
+size 4683072224
diff --git a/hf.Q5_K_M.gguf b/hf.Q5_K_M.gguf
new file mode 100644
index 0000000..2468b18
--- /dev/null
+++ b/hf.Q5_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1999e80bddab39b7b1cfa703f4a6820850f2a55278b3124cce2ec567a550150b
+size 5444829920
diff --git a/unsloth.F16.gguf b/unsloth.F16.gguf
new file mode 100644
index 0000000..a6b764b
--- /dev/null
+++ b/unsloth.F16.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b62582e11748abadb24329971d00d04d33ac4294c70c0ea92b53adc358d675e1
+size 15237851296
diff --git a/unsloth.Q8_0.gguf b/unsloth.Q8_0.gguf
new file mode 100644
index 0000000..7bd38e6
--- /dev/null
+++ b/unsloth.Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b0426a2fc786a9f8c557bc7b3429ccbc62ff4bd80a7bf9a75dfc971d893de1c
+size 8098523296