From 2800de32dba571bbf8374105e18b8e52e4800ab7 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 15 May 2026 20:09:06 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: hassanaitnacer/wav2vec2-large-xlsr-moroccan-darija-v4 Source: Original Platform --- .gitattributes | 35 ++++++ README.md | 64 ++++++++++ added_tokens.json | 8 ++ config.json | 117 ++++++++++++++++++ model.safetensors | 3 + preprocessor_config.json | 9 ++ ...out.tfevents.1720093200.31c1ed75f77e.719.0 | 3 + special_tokens_map.json | 30 +++++ tokenizer_config.json | 79 ++++++++++++ training_args.bin | 3 + vocab.json | 67 ++++++++++ 11 files changed, 418 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 config.json create mode 100644 model.safetensors create mode 100644 preprocessor_config.json create mode 100644 runs/Jul04_11-33-22_31c1ed75f77e/events.out.tfevents.1720093200.31c1ed75f77e.719.0 create mode 100644 special_tokens_map.json create mode 100644 tokenizer_config.json create mode 100644 training_args.bin create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..a6344aa --- /dev/null +++ b/.gitattributes @@ -0,0 +1,35 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs 
merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..13acdb2 --- /dev/null +++ b/README.md @@ -0,0 +1,64 @@ +--- +license: apache-2.0 +base_model: hassanaitnacer/wav2vec2-large-xlsr-moroccan-darija-v3 +tags: +- generated_from_trainer +metrics: +- wer +model-index: +- name: wav2vec2-large-xlsr-moroccan-darija-v4 + results: [] +--- + + + +# wav2vec2-large-xlsr-moroccan-darija-v4 + +This model is a fine-tuned version of [hassanaitnacer/wav2vec2-large-xlsr-moroccan-darija-v3](https://huggingface.co/hassanaitnacer/wav2vec2-large-xlsr-moroccan-darija-v3) on an unknown dataset. 
+It achieves the following results on the evaluation set: +- Loss: 0.0394 +- Wer: 0.0816 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 0.0001 +- train_batch_size: 16 +- eval_batch_size: 8 +- seed: 42 +- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08 +- lr_scheduler_type: linear +- lr_scheduler_warmup_steps: 500 +- num_epochs: 4 +- mixed_precision_training: Native AMP + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | Wer | +|:-------------:|:------:|:----:|:---------------:|:------:| +| 0.0512 | 1.0225 | 500 | 0.0410 | 0.0872 | +| 0.0629 | 2.0450 | 1000 | 0.0508 | 0.0844 | +| 0.0384 | 3.0675 | 1500 | 0.0394 | 0.0816 | + + +### Framework versions + +- Transformers 4.43.0.dev0 +- Pytorch 2.3.0+cu121 +- Datasets 2.20.0 +- Tokenizers 0.19.1 diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..330a7ab --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,8 @@ +{ + "</s>": 66, + "<s>": 65, + "پ": 70, + "چ": 68, + "ڤ": 67, + "گ": 69 +} diff --git a/config.json b/config.json new file mode 100644 index 0000000..9e78291 --- /dev/null +++ b/config.json @@ -0,0 +1,117 @@ +{ + "_name_or_path": "hassanaitnacer/wav2vec2-large-xlsr-moroccan-darija-v3", + "activation_dropout": 0.0, + "adapter_attn_dim": null, + "adapter_kernel_size": 3, + "adapter_stride": 2, + "add_adapter": false, + "apply_spec_augment": true, + "architectures": [ + "Wav2Vec2ForCTC" + ], + "attention_dropout": 0.0, + "bos_token_id": 1, + "classifier_proj_size": 256, + "codevector_dim": 768, + "contrastive_logits_temperature": 0.1, + "conv_bias": true, + "conv_dim": [ + 512, + 512, + 512, + 512, + 512, + 512, + 512 + ], + "conv_kernel": [ + 10, + 3, + 3, + 3, + 3, + 2, + 2 + ], + "conv_stride": [ +
5, + 2, + 2, + 2, + 2, + 2, + 2 + ], + "ctc_loss_reduction": "mean", + "ctc_zero_infinity": false, + "diversity_loss_weight": 0.1, + "do_stable_layer_norm": true, + "eos_token_id": 2, + "feat_extract_activation": "gelu", + "feat_extract_dropout": 0.0, + "feat_extract_norm": "layer", + "feat_proj_dropout": 0.0, + "feat_quantizer_dropout": 0.0, + "final_dropout": 0.0, + "gradient_checkpointing": false, + "hidden_act": "gelu", + "hidden_dropout": 0.0, + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 4096, + "layer_norm_eps": 1e-05, + "layerdrop": 0.0, + "mask_channel_length": 10, + "mask_channel_min_space": 1, + "mask_channel_other": 0.0, + "mask_channel_prob": 0.0, + "mask_channel_selection": "static", + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_min_space": 1, + "mask_time_other": 0.0, + "mask_time_prob": 0.05, + "mask_time_selection": "static", + "model_type": "wav2vec2", + "num_adapter_layers": 3, + "num_attention_heads": 16, + "num_codevector_groups": 2, + "num_codevectors_per_group": 320, + "num_conv_pos_embedding_groups": 16, + "num_conv_pos_embeddings": 128, + "num_feat_extract_layers": 7, + "num_hidden_layers": 24, + "num_negatives": 100, + "output_hidden_size": 1024, + "pad_token_id": 64, + "proj_codevector_dim": 768, + "tdnn_dilation": [ + 1, + 2, + 3, + 1, + 1 + ], + "tdnn_dim": [ + 512, + 512, + 512, + 512, + 1500 + ], + "tdnn_kernel": [ + 5, + 3, + 3, + 1, + 1 + ], + "torch_dtype": "float32", + "transformers_version": "4.43.0.dev0", + "use_weighted_layer_sum": false, + "vocab_size": 71, + "xvector_output_dim": 512 +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..d1983e5 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4549d68408e72256503148794dd4fe8056e4bfcd701b69d970b72a35b2358372 +size 1262098580 diff --git 
a/preprocessor_config.json b/preprocessor_config.json new file mode 100644 index 0000000..73caa15 --- /dev/null +++ b/preprocessor_config.json @@ -0,0 +1,9 @@ +{ + "do_normalize": true, + "feature_extractor_type": "Wav2Vec2FeatureExtractor", + "feature_size": 1, + "padding_side": "right", + "padding_value": 0.0, + "return_attention_mask": true, + "sampling_rate": 16000 +} diff --git a/runs/Jul04_11-33-22_31c1ed75f77e/events.out.tfevents.1720093200.31c1ed75f77e.719.0 b/runs/Jul04_11-33-22_31c1ed75f77e/events.out.tfevents.1720093200.31c1ed75f77e.719.0 new file mode 100644 index 0000000..8322222 --- /dev/null +++ b/runs/Jul04_11-33-22_31c1ed75f77e/events.out.tfevents.1720093200.31c1ed75f77e.719.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337c7584b1387fbe73ec94d4d2aacc0f35091dbd88c7a91355daa48fe7ea53b6 +size 8638 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..7f1669a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,30 @@ +{ + "bos_token": { + "content": "<s>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "</s>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "[PAD]", + "lstrip": true, + "normalized": false, + "rstrip": true, + "single_word": false + }, + "unk_token": { + "content": "[UNK]", + "lstrip": true, + "normalized": false, + "rstrip": true, + "single_word": false + } +} diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..04d04f7 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,79 @@ +{ + "added_tokens_decoder": { + "63": { + "content": "[UNK]", + "lstrip": true, + "normalized": false, + "rstrip": true, + "single_word": false, + "special": false + }, + "64": { + "content": "[PAD]", + "lstrip": true, + "normalized": false, + "rstrip": true, + "single_word": false, + "special": false + }, +
"65": { + "content": "<s>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "66": { + "content": "</s>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "67": { + "content": "ڤ", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "68": { + "content": "چ", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "69": { + "content": "گ", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "70": { + "content": "پ", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "bos_token": "<s>", + "clean_up_tokenization_spaces": true, + "do_lower_case": false, + "eos_token": "</s>", + "model_max_length": 1000000000000000019884624838656, + "pad_token": "[PAD]", + "replace_word_delimiter_char": " ", + "target_lang": null, + "tokenizer_class": "Wav2Vec2CTCTokenizer", + "unk_token": "[UNK]", + "word_delimiter_token": "|" +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..fa67683 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feaa51f2f7cbdb3b341761d711e13f05045c7d424d06f97f5e30b94177147945 +size 5240 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..f88e70c --- /dev/null +++ b/vocab.json @@ -0,0 +1,67 @@ +{ + "\n": 58, + "@": 5, + "[PAD]": 64, + "[UNK]": 63, + "_": 1, + "a": 53, + "c": 45, + "d": 16, + "e": 47, + "h": 49, + "i": 23, + "k": 27, + "n": 14, + "o": 51, + "p": 55, + "r": 24, + "s": 31, + "t": 32, + "v": 25, + "|": 2, + "؟": 48, + "ء": 29, + "آ": 10, + "أ": 56, + "ؤ": 36, + "إ": 62, + "ئ": 17, + "ا": 0, + "ب": 50, + "ة": 18, + "ت": 43, + "ث": 13, + "ج": 15, + "ح": 60, + "خ": 59, + "د": 54, + "ذ": 6, + "ر":
30, + "ز": 20, + "س": 52, + "ش": 8, + "ص": 11, + "ض": 38, + "ط": 42, + "ظ": 46, + "ع": 21, + "غ": 9, + "ـ": 34, + "ف": 22, + "ق": 37, + "ك": 3, + "ل": 40, + "م": 39, + "ن": 4, + "ه": 19, + "و": 61, + "ى": 33, + "ي": 12, + "ِ": 28, + "ّ": 44, + "ْ": 57, + "ٖ": 7, + "ڸ": 26, + " ": 35, + "…": 41 +}