|
{ |
|
"best_metric": 0.830047070980072, |
|
"best_model_checkpoint": "./output/clip-finetuned-csu-p14-336-e4l57-l/checkpoint-2500", |
|
"epoch": 0.2814364516492176, |
|
"eval_steps": 500, |
|
"global_step": 2500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.056287290329843524, |
|
"grad_norm": 150.1642303466797, |
|
"learning_rate": 4.929640887087696e-07, |
|
"loss": 0.3486, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.056287290329843524, |
|
"eval_loss": 1.1265727281570435, |
|
"eval_runtime": 123.7806, |
|
"eval_samples_per_second": 15.948, |
|
"eval_steps_per_second": 1.995, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.11257458065968705, |
|
"grad_norm": 366.6913146972656, |
|
"learning_rate": 4.859281774175391e-07, |
|
"loss": 0.2733, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.11257458065968705, |
|
"eval_loss": 0.9742079377174377, |
|
"eval_runtime": 125.8047, |
|
"eval_samples_per_second": 15.691, |
|
"eval_steps_per_second": 1.963, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.16886187098953057, |
|
"grad_norm": 555.5016479492188, |
|
"learning_rate": 4.788922661263087e-07, |
|
"loss": 0.1851, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.16886187098953057, |
|
"eval_loss": 0.9162159562110901, |
|
"eval_runtime": 126.7606, |
|
"eval_samples_per_second": 15.573, |
|
"eval_steps_per_second": 1.949, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.2251491613193741, |
|
"grad_norm": 0.423260897397995, |
|
"learning_rate": 4.7185635483507824e-07, |
|
"loss": 0.1973, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.2251491613193741, |
|
"eval_loss": 0.8716973662376404, |
|
"eval_runtime": 127.6955, |
|
"eval_samples_per_second": 15.459, |
|
"eval_steps_per_second": 1.934, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.2814364516492176, |
|
"grad_norm": 6.840139389038086, |
|
"learning_rate": 4.6482044354384774e-07, |
|
"loss": 0.1881, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.2814364516492176, |
|
"eval_loss": 0.830047070980072, |
|
"eval_runtime": 128.0771, |
|
"eval_samples_per_second": 15.413, |
|
"eval_steps_per_second": 1.929, |
|
"step": 2500 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 35532, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 4, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 900115394852520.0, |
|
"train_batch_size": 2, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|