57 lines
1.4 KiB
JSON
57 lines
1.4 KiB
JSON
|
|
{
|
||
|
|
"experiment_info": {
|
||
|
|
"model_name": "facebook/wav2vec2-large-xlsr-53",
|
||
|
|
"model_description": "XLSR-53",
|
||
|
|
"dataset_name": "h3llohihi/lao-asr-thesis-dataset",
|
||
|
|
"training_date": "2025-06-03 19:11:56",
|
||
|
|
"vocab_size": 55,
|
||
|
|
"primary_metric": "cer"
|
||
|
|
},
|
||
|
|
"training_config": {
|
||
|
|
"dataset_name": "h3llohihi/lao-asr-thesis-dataset",
|
||
|
|
"gradient_accumulation": 1,
|
||
|
|
"weight_decay": 0.01,
|
||
|
|
"warmup_steps": 400,
|
||
|
|
"num_epochs": 15,
|
||
|
|
"max_steps": -1,
|
||
|
|
"eval_steps": 250,
|
||
|
|
"save_steps": 500,
|
||
|
|
"logging_steps": 50,
|
||
|
|
"early_stopping_patience": 6,
|
||
|
|
"dataloader_workers": 8,
|
||
|
|
"use_fp16": false,
|
||
|
|
"gradient_checkpointing": true,
|
||
|
|
"label_smoothing": 0.0,
|
||
|
|
"primary_metric": "cer",
|
||
|
|
"secondary_metric": "wer",
|
||
|
|
"logs_dir": "./logs",
|
||
|
|
"model_name": "facebook/wav2vec2-large-xlsr-53",
|
||
|
|
"description": "XLSR-53",
|
||
|
|
"output_dir": "./lao-asr-xlsr-53",
|
||
|
|
"batch_size": 16,
|
||
|
|
"learning_rate": 0.0001
|
||
|
|
},
|
||
|
|
"results": {
|
||
|
|
"validation": {
|
||
|
|
"cer": 0.16520911038806443,
|
||
|
|
"wer": 1.0,
|
||
|
|
"loss": 0.48708805441856384
|
||
|
|
},
|
||
|
|
"test": {
|
||
|
|
"cer": 0.16219106723220977,
|
||
|
|
"wer": 0.9958333333333333,
|
||
|
|
"loss": 0.41934534907341003
|
||
|
|
},
|
||
|
|
"dev": {
|
||
|
|
"cer": 0.10665818490245971,
|
||
|
|
"wer": 0.975,
|
||
|
|
"loss": 0.1934221088886261
|
||
|
|
}
|
||
|
|
},
|
||
|
|
"training_metrics": {
|
||
|
|
"final_loss": 1.7461039689566584,
|
||
|
|
"training_time": 12829.0071,
|
||
|
|
"samples_per_second": 4.499,
|
||
|
|
"total_steps": 0
|
||
|
|
}
|
||
|
|
}
|