|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 29.357798165137616, |
|
"global_step": 3200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 3.67, |
|
"learning_rate": 0.00023999999999999998, |
|
"loss": 5.0456, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"eval_loss": 2.805786609649658, |
|
"eval_runtime": 214.876, |
|
"eval_samples_per_second": 7.665, |
|
"eval_wer": 1.0, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"learning_rate": 0.0002675090252707581, |
|
"loss": 0.8437, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"eval_loss": 0.437711238861084, |
|
"eval_runtime": 217.8287, |
|
"eval_samples_per_second": 7.561, |
|
"eval_wer": 0.5915636809314677, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"learning_rate": 0.00022418772563176893, |
|
"loss": 0.2449, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"eval_loss": 0.3937138020992279, |
|
"eval_runtime": 222.9363, |
|
"eval_samples_per_second": 7.388, |
|
"eval_wer": 0.5292615667449698, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 14.68, |
|
"learning_rate": 0.00018086642599277977, |
|
"loss": 0.1486, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 14.68, |
|
"eval_loss": 0.411156564950943, |
|
"eval_runtime": 224.0258, |
|
"eval_samples_per_second": 7.352, |
|
"eval_wer": 0.5094474517413952, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 18.35, |
|
"learning_rate": 0.00013754512635379062, |
|
"loss": 0.1077, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 18.35, |
|
"eval_loss": 0.41311565041542053, |
|
"eval_runtime": 224.2133, |
|
"eval_samples_per_second": 7.346, |
|
"eval_wer": 0.49474006740884485, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 22.02, |
|
"learning_rate": 9.422382671480144e-05, |
|
"loss": 0.0791, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 22.02, |
|
"eval_loss": 0.43790802359580994, |
|
"eval_runtime": 224.8995, |
|
"eval_samples_per_second": 7.323, |
|
"eval_wer": 0.48707997140230824, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 25.69, |
|
"learning_rate": 5.090252707581227e-05, |
|
"loss": 0.0722, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 25.69, |
|
"eval_loss": 0.4185827076435089, |
|
"eval_runtime": 222.949, |
|
"eval_samples_per_second": 7.387, |
|
"eval_wer": 0.46798079869267695, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 29.36, |
|
"learning_rate": 7.581227436823104e-06, |
|
"loss": 0.0601, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 29.36, |
|
"eval_loss": 0.41515499353408813, |
|
"eval_runtime": 225.7543, |
|
"eval_samples_per_second": 7.296, |
|
"eval_wer": 0.4620569911142886, |
|
"step": 3200 |
|
} |
|
], |
|
"max_steps": 3270, |
|
"num_train_epochs": 30, |
|
"total_flos": 1.260196128535726e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|