File size: 2,356 Bytes
e30beec f7749a6 7aeaae7 f7749a6 e30beec f05059c 7aeaae7 f05059c e30beec f05059c e30beec 7aeaae7 f05059c 7aeaae7 f05059c 7aeaae7 f05059c 7aeaae7 f05059c 7aeaae7 8d3381d f05059c 53ddeb5 f7749a6 e30beec 7aeaae7 e30beec 7aeaae7 e30beec f05059c e30beec f7749a6 7aeaae7 e30beec |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.026905829596412557,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.004484304932735426,
"grad_norm": 0.006755814887583256,
"learning_rate": 2e-05,
"loss": 11.9309,
"step": 1
},
{
"epoch": 0.004484304932735426,
"eval_loss": 11.931302070617676,
"eval_runtime": 0.5278,
"eval_samples_per_second": 1422.827,
"eval_steps_per_second": 89.045,
"step": 1
},
{
"epoch": 0.008968609865470852,
"grad_norm": 0.008150096982717514,
"learning_rate": 4e-05,
"loss": 11.9311,
"step": 2
},
{
"epoch": 0.013452914798206279,
"grad_norm": 0.00839826837182045,
"learning_rate": 6e-05,
"loss": 11.9313,
"step": 3
},
{
"epoch": 0.013452914798206279,
"eval_loss": 11.931297302246094,
"eval_runtime": 0.521,
"eval_samples_per_second": 1441.543,
"eval_steps_per_second": 90.216,
"step": 3
},
{
"epoch": 0.017937219730941704,
"grad_norm": 0.007786044850945473,
"learning_rate": 8e-05,
"loss": 11.9324,
"step": 4
},
{
"epoch": 0.02242152466367713,
"grad_norm": 0.009498490951955318,
"learning_rate": 0.0001,
"loss": 11.9317,
"step": 5
},
{
"epoch": 0.026905829596412557,
"grad_norm": 0.008360755629837513,
"learning_rate": 0.00012,
"loss": 11.9318,
"step": 6
},
{
"epoch": 0.026905829596412557,
"eval_loss": 11.931273460388184,
"eval_runtime": 0.5165,
"eval_samples_per_second": 1454.119,
"eval_steps_per_second": 91.003,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 10,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 5789908992.0,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|