From 0c93d797003475087372ccdae03edfed5b01ad64 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 27 May 2026 08:08:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: kth8/gemma-3-270m-it-JSON-Fixer-GGUF Source: Original Platform --- .gitattributes | 40 +++++++++++ README.md | 97 ++++++++++++++++++++++++++ gemma-3-270m-it-JSON-Fixer-Q4_0.gguf | 3 + gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf | 3 + gemma-3-270m-it-JSON-Fixer-Q6_K.gguf | 3 + gemma-3-270m-it-JSON-Fixer-Q8_0.gguf | 3 + gemma-3-270m-it-JSON-Fixer-bf16.gguf | 3 + 7 files changed, 152 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 gemma-3-270m-it-JSON-Fixer-Q4_0.gguf create mode 100644 gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf create mode 100644 gemma-3-270m-it-JSON-Fixer-Q6_K.gguf create mode 100644 gemma-3-270m-it-JSON-Fixer-Q8_0.gguf create mode 100644 gemma-3-270m-it-JSON-Fixer-bf16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..8445ee4 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,40 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot 
filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +gemma-3-270m-it-JSON-Fixer-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +gemma-3-270m-it-JSON-Fixer-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +gemma-3-270m-it-JSON-Fixer-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +gemma-3-270m-it-JSON-Fixer-bf16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..3874695 --- /dev/null +++ b/README.md @@ -0,0 +1,97 @@ +--- +license: gemma +language: +- en +base_model: kth8/gemma-3-270m-it-JSON-Fixer +datasets: +- kth8/json-fix-25000x +pipeline_tag: text-generation +library_name: transformers +tags: +- sft +- trl +- unsloth +- google +- gemma +- gemma3 +- gemma3_text +--- +![logo](https://storage.googleapis.com/gweb-developer-goog-blog-assets/images/gemma-3_2.original.png) +A fine-tune of [unsloth/gemma-3-270m-it](https://huggingface.co/unsloth/gemma-3-270m-it) on the [kth8/json-fix-25000x](https://huggingface.co/datasets/kth8/json-fix-25000x) dataset. + +## Usage example +**System prompt** +``` +You are a JSON formatting specialist. 
Convert the provided JSON data into valid JSON format with 2 line indent and no additional commentary. +``` +**User prompt** +``` +The JSON is:\n[{\"name\":\"John Doe\", \"jobTitle\":Software Engineer, \"department\": \"Research and Development\"],, {\"name\"\"Jane Smith\", \"jobTitle\":\"Data Analyst', \"department\":\"Marketing and Sales\"}, ] //\" comment\n-- end -- +``` +**Assistant response** +``` +[ + { + "name": "John Doe", + "jobTitle": "Software Engineer", + "department": "Research and Development" + }, + { + "name": "Jane Smith", + "jobTitle": "Data Analyst", + "department": "Marketing and Sales" + } +] +``` +## Model Details +- Base Model: `unsloth/gemma-3-270m-it` +- Parameter Count: 268,098,176 +- Precision: torch.bfloat16 + +### Hardware +- GPU: NVIDIA RTX PRO 6000 Blackwell Server Edition +- Announced: Mar 17th, 2025 +- Release Date: Mar 18th, 2025 +- Memory Type: GDDR7 +- Bandwidth: 1.79 TB/s +- Memory Size: 96 GB +- Memory Bus: 512-bit +- Shading Units: 24064 +- TDP: 600W +- FP16 (half): 126.0 TFLOPS (1:1) + +## Training Settings +### PEFT +- Rank: 32 +- LoRA alpha: 64 +- Modules: q_proj, k_proj, v_proj, o_proj, gate_proj, up_proj, down_proj +- Gradient checkpointing: unsloth + +### SFT +- Epochs: 2 +- Batch size: 32 +- Gradient accumulation steps: 1 +- Warmup ratio: 0.05 +- Learning rate: 0.0004 +- Optimizer: adamw_torch_fused +- Learning rate scheduler: cosine +- Max seq length: 2048 + +## Training stats +- Date: 2026-03-23T04:39:38.019077 +- Peak VRAM usage: 64.5 GB +- Global step: 1538 +- Training runtime (seconds): 1142.9274 +- Average training loss: 0.004019292104312295 +- Final validation loss: 0.0014343492221087217 + +## Framework versions +- Unsloth: 2026.3.10 +- TRL: 0.22.2 +- Transformers: 4.56.2 +- PyTorch: 2.10.0+cu128 +- Datasets: 4.8.3 +- Tokenizers: 0.22.2 + +## License +This model is released under the Gemma license. 
See the [Gemma Terms of Use](https://ai.google.dev/gemma/terms) and [Prohibited Use Policy](https://policies.google.com/terms/generative-ai/use-policy) regarding the use of Gemma-generated content. \ No newline at end of file diff --git a/gemma-3-270m-it-JSON-Fixer-Q4_0.gguf b/gemma-3-270m-it-JSON-Fixer-Q4_0.gguf new file mode 100644 index 0000000..56e9212 --- /dev/null +++ b/gemma-3-270m-it-JSON-Fixer-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc2374f4060377dec1c1bea8f6b9040fa7f475c23ed613d886160d72fb0f7c35 +size 241411072 diff --git a/gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf b/gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf new file mode 100644 index 0000000..2c4606b --- /dev/null +++ b/gemma-3-270m-it-JSON-Fixer-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f6252ab0032ee144fd66823537b434a1881774639935c7ac89568b9f7a8a22 +size 253115392 diff --git a/gemma-3-270m-it-JSON-Fixer-Q6_K.gguf b/gemma-3-270m-it-JSON-Fixer-Q6_K.gguf new file mode 100644 index 0000000..04fb473 --- /dev/null +++ b/gemma-3-270m-it-JSON-Fixer-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:644f67a813b8e94b77bf9025663233d03a4b420dabbae9b883f3f8df2571a2a8 +size 282975232 diff --git a/gemma-3-270m-it-JSON-Fixer-Q8_0.gguf b/gemma-3-270m-it-JSON-Fixer-Q8_0.gguf new file mode 100644 index 0000000..9870989 --- /dev/null +++ b/gemma-3-270m-it-JSON-Fixer-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e642c6b0350a52774b186a43bb1f7472c87b83a2c08ded46be14a713bc530c47 +size 291546112 diff --git a/gemma-3-270m-it-JSON-Fixer-bf16.gguf b/gemma-3-270m-it-JSON-Fixer-bf16.gguf new file mode 100644 index 0000000..da07415 --- /dev/null +++ b/gemma-3-270m-it-JSON-Fixer-bf16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c3a9fa0e5b456061d41517631924ed994d3f80ddba829cc6591e64992cfe6b +size 542835712