|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 59.991596638655466, |
|
"global_step": 3540, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 5.08, |
|
"learning_rate": 0.0003546, |
|
"loss": 6.338, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 5.08, |
|
"eval_loss": 3.1361563205718994, |
|
"eval_runtime": 51.9297, |
|
"eval_samples_per_second": 12.632, |
|
"eval_wer": 1.0, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 10.17, |
|
"learning_rate": 0.0005715592105263158, |
|
"loss": 3.1258, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 10.17, |
|
"eval_loss": 3.0660765171051025, |
|
"eval_runtime": 50.6635, |
|
"eval_samples_per_second": 12.948, |
|
"eval_wer": 1.0, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 15.25, |
|
"learning_rate": 0.0005132368421052633, |
|
"loss": 1.4079, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 15.25, |
|
"eval_loss": 0.5029116272926331, |
|
"eval_runtime": 51.4993, |
|
"eval_samples_per_second": 12.738, |
|
"eval_wer": 0.6116052520118593, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 20.34, |
|
"learning_rate": 0.00045491447368421056, |
|
"loss": 0.1446, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 20.34, |
|
"eval_loss": 0.5113032460212708, |
|
"eval_runtime": 51.276, |
|
"eval_samples_per_second": 12.794, |
|
"eval_wer": 0.5307073274036426, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 25.42, |
|
"learning_rate": 0.0003965921052631579, |
|
"loss": 0.0714, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 25.42, |
|
"eval_loss": 0.5406283140182495, |
|
"eval_runtime": 51.4595, |
|
"eval_samples_per_second": 12.748, |
|
"eval_wer": 0.5006353240152478, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 30.5, |
|
"learning_rate": 0.00033826973684210527, |
|
"loss": 0.0459, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 30.5, |
|
"eval_loss": 0.5775919556617737, |
|
"eval_runtime": 51.4074, |
|
"eval_samples_per_second": 12.761, |
|
"eval_wer": 0.49767047861075814, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 35.59, |
|
"learning_rate": 0.0002799473684210526, |
|
"loss": 0.0372, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 35.59, |
|
"eval_loss": 0.5846429467201233, |
|
"eval_runtime": 51.8427, |
|
"eval_samples_per_second": 12.654, |
|
"eval_wer": 0.4805167301990682, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 40.67, |
|
"learning_rate": 0.00022162500000000003, |
|
"loss": 0.0297, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 40.67, |
|
"eval_loss": 0.5748910903930664, |
|
"eval_runtime": 51.453, |
|
"eval_samples_per_second": 12.75, |
|
"eval_wer": 0.4841168996188056, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 45.76, |
|
"learning_rate": 0.0001633026315789474, |
|
"loss": 0.0254, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 45.76, |
|
"eval_loss": 0.592321515083313, |
|
"eval_runtime": 51.3943, |
|
"eval_samples_per_second": 12.764, |
|
"eval_wer": 0.4614570097416349, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 50.84, |
|
"learning_rate": 0.00010498026315789474, |
|
"loss": 0.0198, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 50.84, |
|
"eval_loss": 0.5621945261955261, |
|
"eval_runtime": 51.5882, |
|
"eval_samples_per_second": 12.716, |
|
"eval_wer": 0.4404913172384583, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 55.92, |
|
"learning_rate": 4.665789473684211e-05, |
|
"loss": 0.0193, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 55.92, |
|
"eval_loss": 0.5657602548599243, |
|
"eval_runtime": 71.8217, |
|
"eval_samples_per_second": 9.134, |
|
"eval_wer": 0.4470563320626853, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 59.99, |
|
"step": 3540, |
|
"total_flos": 3.4970554953107223e+19, |
|
"train_runtime": 23737.912, |
|
"train_samples_per_second": 0.149 |
|
} |
|
], |
|
"max_steps": 3540, |
|
"num_train_epochs": 60, |
|
"total_flos": 3.4970554953107223e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|