From 45d9c23d0ba169cbcb19a8b1891be1e6038daf00 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 9 Jun 2026 16:10:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: Kortix/FastApply-7B-v1.0_GGUF Source: Original Platform --- .gitattributes | 41 ++++++++++++++++ README.md | 120 ++++++++++++++++++++++++++++++++++++++++++++++ config.json | 3 ++ hf.Q4_K_M.gguf | 3 ++ hf.Q5_K_M.gguf | 3 ++ unsloth.F16.gguf | 3 ++ unsloth.Q8_0.gguf | 3 ++ 7 files changed, 176 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 config.json create mode 100644 hf.Q4_K_M.gguf create mode 100644 hf.Q5_K_M.gguf create mode 100644 unsloth.F16.gguf create mode 100644 unsloth.Q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..e0bc186 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,41 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs 
merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +unsloth.F16.gguf filter=lfs diff=lfs merge=lfs -text +unsloth.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +fastapply-7b-v1.0-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +fastapply-7b-v1.0-q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +hf.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +hf.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..cd1435a --- /dev/null +++ b/README.md @@ -0,0 +1,120 @@ +--- +base_model: unsloth/qwen2.5-coder-7b-instruct-bnb-4bit +language: +- en +license: apache-2.0 +tags: +- text-generation-inference +- transformers +- unsloth +- qwen2 +- trl +- sft +- fast-apply +- instant-apply +--- + +# FastApply-7B-v1.0 + +[Github: kortix-ai/fast-apply](https://github.com/kortix-ai/fast-apply) +[Dataset: Kortix/FastApply-dataset-v1.0](https://huggingface.co/datasets/Kortix/FastApply-dataset-v1.0) +[Try it now on 👉 Google Colab](https://colab.research.google.com/drive/1aBqM8Lqso0Xfgtr75G4LFQivXcChU_36?usp=sharing) + +## Model Details + +### Basic Information + +- **Developed by:** Kortix +- **License:** apache-2.0 +- **Finetuned from model:** [unsloth/Qwen2.5-Coder-7B-Instruct-bnb-4bit](https://huggingface.co/unsloth/Qwen2.5-Coder-7B-Instruct-bnb-4bit) + +### Model Description + +FastApply-7B-v1.0 is a 7B model designed for instant code 
application, producing full file edits to power [SoftGen AI](https://softgen.ai/). +It is part of the Fast Apply pipeline for data generation and fine-tuning Qwen2.5 Coder models. + +The model achieves high throughput when deployed on fast providers like Fireworks while maintaining high edit accuracy, with a speed of approximately 150 tokens/second. + +## Intended Use + +FastApply-7B-v1.0 is intended for use in AI-powered code editors and tools that require fast, accurate code modifications. It is particularly well-suited for: + +- Instant code application tasks +- Full file edits +- Integration with AI-powered code editors like Aider and PearAI +- Local tools to reduce the cost of frontier model output + +## Inference template + +FastApply-7B-v1.0 is based on the Qwen2.5 Coder architecture and is fine-tuned for code editing tasks. It uses a specific prompt structure for inference: + +``` +<|im_start|>system +You are a coding assistant that helps merge code updates, ensuring every modification is fully integrated.<|im_end|> +<|im_start|>user +Merge all changes from the <update> snippet into the <code> below. +- Preserve the code's structure, order, comments, and indentation exactly. +- Output only the updated code, enclosed within <updated-code> and </updated-code> tags. +- Do not include any additional text, explanations, placeholders, ellipses, or code fences. + +<code>{original_code}</code> + +<update>{update_snippet}</update> + +Provide the complete updated code.<|im_end|> +<|im_start|>assistant +``` + +The model's output is structured as: + +``` +<updated-code>[Full-complete updated file]</updated-code> +``` + +## Additional Information + +For more details on the Fast Apply pipeline, data generation process, and deployment instructions, please refer to the [GitHub repository](https://github.com/kortix-ai/fast-apply). 
+ +## How to Use + +To use the model, you can load it using the Hugging Face Transformers library: + + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer + +model = AutoModelForCausalLM.from_pretrained("Kortix/FastApply-7B-v1.0") +tokenizer = AutoTokenizer.from_pretrained("Kortix/FastApply-7B-v1.0") + +# Prepare your input following the prompt structure mentioned above +input_text = """<|im_start|>system +You are a coding assistant that helps merge code updates, ensuring every modification is fully integrated.<|im_end|> +<|im_start|>user +Merge all changes from the <update> snippet into the <code> below. +- Preserve the code's structure, order, comments, and indentation exactly. +- Output only the updated code, enclosed within <updated-code> and </updated-code> tags. +- Do not include any additional text, explanations, placeholders, ellipses, or code fences. + +<code>{original_code}</code> + +<update>{update_snippet}</update> + +Provide the complete updated code.<|im_end|> +<|im_start|>assistant +""" + +input_text = input_text.format( + original_code=original_code, + update_snippet=update_snippet, +).strip() + +# Generate the response +input_ids = tokenizer.encode(input_text, return_tensors="pt") +output = model.generate(input_ids, max_length=8192,) + +response = tokenizer.decode(output[0][len(input_ids[0]):]) +print(response) + +# Extract the updated code from the response +updated_code = response.split("<updated-code>")[1].split("</updated-code>")[0] +``` \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..5ca493c --- /dev/null +++ b/config.json @@ -0,0 +1,3 @@ +{ + "model_type": "qwen2" +} \ No newline at end of file diff --git a/hf.Q4_K_M.gguf b/hf.Q4_K_M.gguf new file mode 100644 index 0000000..af11e14 --- /dev/null +++ b/hf.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7077ca675eeea5cbad509fc296edd50fafad6a32a7d1d9cffc263e4b764357ff +size 4683072224 diff --git a/hf.Q5_K_M.gguf b/hf.Q5_K_M.gguf new file mode 100644 index 0000000..2468b18 --- /dev/null +++ 
b/hf.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1999e80bddab39b7b1cfa703f4a6820850f2a55278b3124cce2ec567a550150b +size 5444829920 diff --git a/unsloth.F16.gguf b/unsloth.F16.gguf new file mode 100644 index 0000000..a6b764b --- /dev/null +++ b/unsloth.F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62582e11748abadb24329971d00d04d33ac4294c70c0ea92b53adc358d675e1 +size 15237851296 diff --git a/unsloth.Q8_0.gguf b/unsloth.Q8_0.gguf new file mode 100644 index 0000000..7bd38e6 --- /dev/null +++ b/unsloth.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0426a2fc786a9f8c557bc7b3429ccbc62ff4bd80a7bf9a75dfc971d893de1c +size 8098523296