|
{ |
|
"best_metric": 0.3285630841121495, |
|
"best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-large-xlsr-persian-asr-shemo_me7494/checkpoint-1700", |
|
"epoch": 12.5, |
|
"eval_steps": 100, |
|
"global_step": 2000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.62, |
|
"learning_rate": 1.98e-06, |
|
"loss": 1.8553, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_loss": 1.4126451015472412, |
|
"eval_runtime": 35.7389, |
|
"eval_samples_per_second": 7.947, |
|
"eval_steps_per_second": 1.007, |
|
"eval_wer": 0.48656542056074764, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 3.980000000000001e-06, |
|
"loss": 1.4083, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_loss": 1.0428400039672852, |
|
"eval_runtime": 35.3623, |
|
"eval_samples_per_second": 8.031, |
|
"eval_steps_per_second": 1.018, |
|
"eval_wer": 0.4366238317757009, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 5.98e-06, |
|
"loss": 1.1718, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_loss": 0.86826491355896, |
|
"eval_runtime": 34.9958, |
|
"eval_samples_per_second": 8.115, |
|
"eval_steps_per_second": 1.029, |
|
"eval_wer": 0.4126752336448598, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 7.980000000000002e-06, |
|
"loss": 0.9919, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"eval_loss": 0.7921169996261597, |
|
"eval_runtime": 33.9628, |
|
"eval_samples_per_second": 8.362, |
|
"eval_steps_per_second": 1.06, |
|
"eval_wer": 0.3919392523364486, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.12, |
|
"learning_rate": 9.980000000000001e-06, |
|
"loss": 0.9493, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.12, |
|
"eval_loss": 0.7675915360450745, |
|
"eval_runtime": 34.6559, |
|
"eval_samples_per_second": 8.195, |
|
"eval_steps_per_second": 1.039, |
|
"eval_wer": 0.3744158878504673, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"learning_rate": 9.346666666666666e-06, |
|
"loss": 0.9414, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"eval_loss": 0.7247262597084045, |
|
"eval_runtime": 34.016, |
|
"eval_samples_per_second": 8.349, |
|
"eval_steps_per_second": 1.058, |
|
"eval_wer": 0.3694509345794392, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"learning_rate": 8.68e-06, |
|
"loss": 0.8897, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"eval_loss": 0.720245897769928, |
|
"eval_runtime": 35.0175, |
|
"eval_samples_per_second": 8.11, |
|
"eval_steps_per_second": 1.028, |
|
"eval_wer": 0.3598130841121495, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 8.013333333333333e-06, |
|
"loss": 0.8716, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 0.7095639109611511, |
|
"eval_runtime": 34.2057, |
|
"eval_samples_per_second": 8.303, |
|
"eval_steps_per_second": 1.052, |
|
"eval_wer": 0.35455607476635514, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.62, |
|
"learning_rate": 7.346666666666668e-06, |
|
"loss": 0.8467, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 5.62, |
|
"eval_loss": 0.7023197412490845, |
|
"eval_runtime": 34.5651, |
|
"eval_samples_per_second": 8.216, |
|
"eval_steps_per_second": 1.042, |
|
"eval_wer": 0.34988317757009346, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"learning_rate": 6.680000000000001e-06, |
|
"loss": 0.8227, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"eval_loss": 0.6994471549987793, |
|
"eval_runtime": 35.0644, |
|
"eval_samples_per_second": 8.099, |
|
"eval_steps_per_second": 1.027, |
|
"eval_wer": 0.3411214953271028, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.88, |
|
"learning_rate": 6.013333333333335e-06, |
|
"loss": 0.855, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 6.88, |
|
"eval_loss": 0.6882991790771484, |
|
"eval_runtime": 33.9338, |
|
"eval_samples_per_second": 8.369, |
|
"eval_steps_per_second": 1.061, |
|
"eval_wer": 0.3431658878504673, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 7.5, |
|
"learning_rate": 5.346666666666667e-06, |
|
"loss": 0.8457, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 7.5, |
|
"eval_loss": 0.6772996187210083, |
|
"eval_runtime": 33.7458, |
|
"eval_samples_per_second": 8.416, |
|
"eval_steps_per_second": 1.067, |
|
"eval_wer": 0.34258177570093457, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"learning_rate": 4.680000000000001e-06, |
|
"loss": 0.7614, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"eval_loss": 0.6912708282470703, |
|
"eval_runtime": 33.9892, |
|
"eval_samples_per_second": 8.356, |
|
"eval_steps_per_second": 1.059, |
|
"eval_wer": 0.33440420560747663, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 8.75, |
|
"learning_rate": 4.013333333333334e-06, |
|
"loss": 0.8127, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 8.75, |
|
"eval_loss": 0.6827006340026855, |
|
"eval_runtime": 33.6998, |
|
"eval_samples_per_second": 8.427, |
|
"eval_steps_per_second": 1.068, |
|
"eval_wer": 0.33352803738317754, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 9.38, |
|
"learning_rate": 3.346666666666667e-06, |
|
"loss": 0.8443, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 9.38, |
|
"eval_loss": 0.6724790930747986, |
|
"eval_runtime": 34.0431, |
|
"eval_samples_per_second": 8.342, |
|
"eval_steps_per_second": 1.057, |
|
"eval_wer": 0.33557242990654207, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 2.68e-06, |
|
"loss": 0.7548, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 0.6758835315704346, |
|
"eval_runtime": 34.9833, |
|
"eval_samples_per_second": 8.118, |
|
"eval_steps_per_second": 1.029, |
|
"eval_wer": 0.3317757009345794, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 10.62, |
|
"learning_rate": 2.0133333333333337e-06, |
|
"loss": 0.7839, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 10.62, |
|
"eval_loss": 0.677266001701355, |
|
"eval_runtime": 34.4604, |
|
"eval_samples_per_second": 8.241, |
|
"eval_steps_per_second": 1.045, |
|
"eval_wer": 0.3285630841121495, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 11.25, |
|
"learning_rate": 1.3466666666666668e-06, |
|
"loss": 0.7912, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 11.25, |
|
"eval_loss": 0.6747676730155945, |
|
"eval_runtime": 35.0861, |
|
"eval_samples_per_second": 8.094, |
|
"eval_steps_per_second": 1.026, |
|
"eval_wer": 0.3285630841121495, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 11.88, |
|
"learning_rate": 6.800000000000001e-07, |
|
"loss": 0.8238, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 11.88, |
|
"eval_loss": 0.673457145690918, |
|
"eval_runtime": 33.7389, |
|
"eval_samples_per_second": 8.418, |
|
"eval_steps_per_second": 1.067, |
|
"eval_wer": 0.32973130841121495, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"learning_rate": 1.3333333333333334e-08, |
|
"loss": 0.7618, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"eval_loss": 0.672848641872406, |
|
"eval_runtime": 34.5736, |
|
"eval_samples_per_second": 8.214, |
|
"eval_steps_per_second": 1.041, |
|
"eval_wer": 0.3285630841121495, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"step": 2000, |
|
"total_flos": 9.605345431463184e+18, |
|
"train_loss": 0.9391711463928223, |
|
"train_runtime": 9697.5717, |
|
"train_samples_per_second": 3.3, |
|
"train_steps_per_second": 0.206 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 2000, |
|
"num_train_epochs": 13, |
|
"save_steps": 100, |
|
"total_flos": 9.605345431463184e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|