33 lines
902 B
JSON
33 lines
902 B
JSON
|
|
{
|
||
|
|
"experiment_id": "ML-ENG-LUG-FULL-A40",
|
||
|
|
"base_model": "Sunbird/asr-whisper-large-v3-salt",
|
||
|
|
"languages": [
|
||
|
|
"lug",
|
||
|
|
"eng"
|
||
|
|
],
|
||
|
|
"training_method": "full",
|
||
|
|
"lora_r": 16,
|
||
|
|
"lora_alpha": 32,
|
||
|
|
"lora_dropout": 0.15,
|
||
|
|
"learning_rate": 1e-05,
|
||
|
|
"optimizer": "adamw_torch_fused",
|
||
|
|
"effective_batch_size": 16,
|
||
|
|
"train_metrics": {
|
||
|
|
"train_runtime": 23999.707,
|
||
|
|
"train_samples_per_second": 1.667,
|
||
|
|
"train_steps_per_second": 0.104,
|
||
|
|
"total_flos": 1.3582858479796224e+20,
|
||
|
|
"train_loss": 0.6222768672943115,
|
||
|
|
"epoch": 3.613048978854148
|
||
|
|
},
|
||
|
|
"test_metrics": {
|
||
|
|
"test_loss": 0.5511467456817627,
|
||
|
|
"test_wer": 0.34776840202900167,
|
||
|
|
"test_cer": 0.18876529976505252,
|
||
|
|
"test_runtime": 1854.5701,
|
||
|
|
"test_samples_per_second": 1.1,
|
||
|
|
"test_steps_per_second": 0.275,
|
||
|
|
"epoch": 3.613048978854148
|
||
|
|
},
|
||
|
|
"hub_repo_id": "KasuleTrevor/cdli-whisper-ml-eng-lug-full-a40"
|
||
|
|
}
|