commit bd6240b88da4a384c66ed51b9da9f819483290c6 Author: ModelHub XC Date: Tue Apr 21 20:43:36 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2cdd294 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,57 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.IQ3_XS.gguf 
filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q3_K.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q4_K.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q5_K.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +sparse_ft_en_sw.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..5fe54ae --- /dev/null +++ b/README.md @@ -0,0 +1,105 @@ +Quantization made by Richard Erkhov. 
+ +[Github](https://github.com/RichardErkhov) + +[Discord](https://discord.gg/pvy7H8DZMG) + +[Request more models](https://github.com/RichardErkhov/quant_request) + + +sparse_ft_en_sw - GGUF +- Model creator: https://huggingface.co/Vivian12300/ +- Original model: https://huggingface.co/Vivian12300/sparse_ft_en_sw/ + + +| Name | Quant method | Size | +| ---- | ---- | ---- | +| [sparse_ft_en_sw.Q2_K.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q2_K.gguf) | Q2_K | 2.96GB | +| [sparse_ft_en_sw.IQ3_XS.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.IQ3_XS.gguf) | IQ3_XS | 3.28GB | +| [sparse_ft_en_sw.IQ3_S.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.IQ3_S.gguf) | IQ3_S | 3.43GB | +| [sparse_ft_en_sw.Q3_K_S.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q3_K_S.gguf) | Q3_K_S | 3.41GB | +| [sparse_ft_en_sw.IQ3_M.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.IQ3_M.gguf) | IQ3_M | 3.52GB | +| [sparse_ft_en_sw.Q3_K.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q3_K.gguf) | Q3_K | 3.74GB | +| [sparse_ft_en_sw.Q3_K_M.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q3_K_M.gguf) | Q3_K_M | 3.74GB | +| [sparse_ft_en_sw.Q3_K_L.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q3_K_L.gguf) | Q3_K_L | 4.03GB | +| [sparse_ft_en_sw.IQ4_XS.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.IQ4_XS.gguf) | IQ4_XS | 4.18GB | +| [sparse_ft_en_sw.Q4_0.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q4_0.gguf) | Q4_0 | 4.34GB | +| 
[sparse_ft_en_sw.IQ4_NL.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.IQ4_NL.gguf) | IQ4_NL | 4.38GB | +| [sparse_ft_en_sw.Q4_K_S.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q4_K_S.gguf) | Q4_K_S | 4.37GB | +| [sparse_ft_en_sw.Q4_K.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q4_K.gguf) | Q4_K | 4.58GB | +| [sparse_ft_en_sw.Q4_K_M.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q4_K_M.gguf) | Q4_K_M | 4.58GB | +| [sparse_ft_en_sw.Q4_1.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q4_1.gguf) | Q4_1 | 4.78GB | +| [sparse_ft_en_sw.Q5_0.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q5_0.gguf) | Q5_0 | 5.21GB | +| [sparse_ft_en_sw.Q5_K_S.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q5_K_S.gguf) | Q5_K_S | 5.21GB | +| [sparse_ft_en_sw.Q5_K.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q5_K.gguf) | Q5_K | 5.34GB | +| [sparse_ft_en_sw.Q5_K_M.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q5_K_M.gguf) | Q5_K_M | 5.34GB | +| [sparse_ft_en_sw.Q5_1.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q5_1.gguf) | Q5_1 | 5.65GB | +| [sparse_ft_en_sw.Q6_K.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q6_K.gguf) | Q6_K | 6.14GB | +| [sparse_ft_en_sw.Q8_0.gguf](https://huggingface.co/RichardErkhov/Vivian12300_-_sparse_ft_en_sw-gguf/blob/main/sparse_ft_en_sw.Q8_0.gguf) | Q8_0 | 7.95GB | + + + + +Original model description: +--- +library_name: transformers 
+license: llama3.1 +base_model: meta-llama/Llama-3.1-8B-Instruct +tags: +- trl +- sft +- generated_from_trainer +datasets: +- generator +model-index: +- name: sparse_ft_en_sw + results: [] +--- + + + +# sparse_ft_en_sw + +This model is a fine-tuned version of [meta-llama/Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct) on the generator dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 5e-05 +- train_batch_size: 1 +- eval_batch_size: 2 +- seed: 42 +- gradient_accumulation_steps: 16 +- total_train_batch_size: 16 +- optimizer: adafactor, with the following args: +No additional optimizer arguments +- lr_scheduler_type: linear +- num_epochs: 5 + +### Training results + + + +### Framework versions + +- Transformers 4.46.3 +- PyTorch 2.3.1+cu121 +- Datasets 2.20.0 +- Tokenizers 0.20.3 + + diff --git a/sparse_ft_en_sw.IQ3_M.gguf b/sparse_ft_en_sw.IQ3_M.gguf new file mode 100644 index 0000000..ad8525d --- /dev/null +++ b/sparse_ft_en_sw.IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b50fa517e93c4785f660819a01752ee63b50a7a1e4d938ed37c87499e0335fe +size 3784828480 diff --git a/sparse_ft_en_sw.IQ3_S.gguf b/sparse_ft_en_sw.IQ3_S.gguf new file mode 100644 index 0000000..c88cb55 --- /dev/null +++ b/sparse_ft_en_sw.IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309c1fdd019aca489de15526b475ae86b058d2a0b053554847c0c616bf5de984 +size 3682330176 diff --git a/sparse_ft_en_sw.IQ3_XS.gguf b/sparse_ft_en_sw.IQ3_XS.gguf new file mode 100644 index 0000000..626f61d --- /dev/null +++ b/sparse_ft_en_sw.IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:849f86d669db38796b8c4763a5f266cf29a19a0ed1bf5330748444520ce3a478 +size 3518752320 diff --git a/sparse_ft_en_sw.IQ4_NL.gguf b/sparse_ft_en_sw.IQ4_NL.gguf new file mode 100644 index 0000000..30dc545 --- /dev/null +++ b/sparse_ft_en_sw.IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d958ffdb4e184d9bf7cff6c63c3162d6eb9397eec5aaefd83bc552faa7e41b69 +size 4707354176 diff --git a/sparse_ft_en_sw.IQ4_XS.gguf b/sparse_ft_en_sw.IQ4_XS.gguf new file mode 100644 index 0000000..16741eb --- /dev/null +++ b/sparse_ft_en_sw.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7290558dada26045adc7e3005e11f6c17b628ae5cf6c13af559a28a44c525fd0 +size 4484367936 diff --git a/sparse_ft_en_sw.Q2_K.gguf b/sparse_ft_en_sw.Q2_K.gguf new file mode 100644 index 0000000..423ee41 --- /dev/null +++ b/sparse_ft_en_sw.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544cbc3875a61b649d9b7dbafbbfa9026f1d07742d94c2ccbbf3a13285ece854 +size 3179136576 diff --git a/sparse_ft_en_sw.Q3_K.gguf b/sparse_ft_en_sw.Q3_K.gguf new file mode 100644 index 0000000..820522e --- /dev/null +++ b/sparse_ft_en_sw.Q3_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accb3639933b8a372cfe5816da97ac053e9a9f6f3fa9a5167a1e3dd33400d5ce +size 4018923072 diff --git a/sparse_ft_en_sw.Q3_K_L.gguf b/sparse_ft_en_sw.Q3_K_L.gguf new file mode 100644 index 0000000..ce723b5 --- /dev/null +++ b/sparse_ft_en_sw.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11647263d09c5fb6afb34a14b7e4c1ca6a99dc1662c32ffda94d913c8aa1e975 +size 4321961536 diff --git a/sparse_ft_en_sw.Q3_K_M.gguf b/sparse_ft_en_sw.Q3_K_M.gguf new file mode 100644 index 0000000..820522e --- /dev/null +++ b/sparse_ft_en_sw.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accb3639933b8a372cfe5816da97ac053e9a9f6f3fa9a5167a1e3dd33400d5ce +size 4018923072 diff --git 
a/sparse_ft_en_sw.Q3_K_S.gguf b/sparse_ft_en_sw.Q3_K_S.gguf new file mode 100644 index 0000000..40d67e5 --- /dev/null +++ b/sparse_ft_en_sw.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412b78d59f6d42925d58b9f06c83964bb6e26364a299632b97629e317e71032e +size 3664504384 diff --git a/sparse_ft_en_sw.Q4_0.gguf b/sparse_ft_en_sw.Q4_0.gguf new file mode 100644 index 0000000..ca0713a --- /dev/null +++ b/sparse_ft_en_sw.Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045178338bee9877afd7d8b896e0ccf3a98fd27aa1ef1a6fc61934c26370b246 +size 4661216832 diff --git a/sparse_ft_en_sw.Q4_1.gguf b/sparse_ft_en_sw.Q4_1.gguf new file mode 100644 index 0000000..b28e91d --- /dev/null +++ b/sparse_ft_en_sw.Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7ee25e8cbbb39cbfb670f1c7f681d4ed924debf750c4be69d8419b3e4e0ec4 +size 5130257984 diff --git a/sparse_ft_en_sw.Q4_K.gguf b/sparse_ft_en_sw.Q4_K.gguf new file mode 100644 index 0000000..6f83d88 --- /dev/null +++ b/sparse_ft_en_sw.Q4_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd37d11fd91ae00ba60a224781c5e06603e28d704ac09c8fc8c7d421f1ffa41c +size 4920739392 diff --git a/sparse_ft_en_sw.Q4_K_M.gguf b/sparse_ft_en_sw.Q4_K_M.gguf new file mode 100644 index 0000000..6f83d88 --- /dev/null +++ b/sparse_ft_en_sw.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd37d11fd91ae00ba60a224781c5e06603e28d704ac09c8fc8c7d421f1ffa41c +size 4920739392 diff --git a/sparse_ft_en_sw.Q4_K_S.gguf b/sparse_ft_en_sw.Q4_K_S.gguf new file mode 100644 index 0000000..1a0adb2 --- /dev/null +++ b/sparse_ft_en_sw.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314c3b0a593c39081e900ab3951b9e8b2c13b1370bbc9bf062c9ac57bfe1f71c +size 4692674112 diff --git a/sparse_ft_en_sw.Q5_0.gguf b/sparse_ft_en_sw.Q5_0.gguf new file mode 100644 index 0000000..80341c5 --- /dev/null 
+++ b/sparse_ft_en_sw.Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3ab229355bf982674fcf3812f2a1458f0b85cd813ebebc47d21ac187389916 +size 5599299136 diff --git a/sparse_ft_en_sw.Q5_1.gguf b/sparse_ft_en_sw.Q5_1.gguf new file mode 100644 index 0000000..b12b6db --- /dev/null +++ b/sparse_ft_en_sw.Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef7e780ff60d122b258ec2ae0128abbe98d21e02a8e4b93ea3ccbe5f7bc33c5 +size 6068340288 diff --git a/sparse_ft_en_sw.Q5_K.gguf b/sparse_ft_en_sw.Q5_K.gguf new file mode 100644 index 0000000..b95fcaa --- /dev/null +++ b/sparse_ft_en_sw.Q5_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd44abb9dd6c3accc85f03fb202cf7ac76c47cd61fcd8cde64052f4ed32d4b2 +size 5732992576 diff --git a/sparse_ft_en_sw.Q5_K_M.gguf b/sparse_ft_en_sw.Q5_K_M.gguf new file mode 100644 index 0000000..b95fcaa --- /dev/null +++ b/sparse_ft_en_sw.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd44abb9dd6c3accc85f03fb202cf7ac76c47cd61fcd8cde64052f4ed32d4b2 +size 5732992576 diff --git a/sparse_ft_en_sw.Q5_K_S.gguf b/sparse_ft_en_sw.Q5_K_S.gguf new file mode 100644 index 0000000..5a43ab1 --- /dev/null +++ b/sparse_ft_en_sw.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5fc9fb439086bff3ee3f9ab6b03d4ed76efc516bf2ac726cf049fe72a4659a +size 5599299136 diff --git a/sparse_ft_en_sw.Q6_K.gguf b/sparse_ft_en_sw.Q6_K.gguf new file mode 100644 index 0000000..598ff42 --- /dev/null +++ b/sparse_ft_en_sw.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c7a109a4dd929a877df0f96c43e4b4c1b3090369dacc9de44879a13b756e7d +size 6596011584 diff --git a/sparse_ft_en_sw.Q8_0.gguf b/sparse_ft_en_sw.Q8_0.gguf new file mode 100644 index 0000000..60722fb --- /dev/null +++ b/sparse_ft_en_sw.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3ed160d45fd9bea3e44429a5dead42395d20095b6bc095f83dd08210991bcb8e +size 8540776000