longformer-simple / checkpoint-41 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 1, checkpoint
04c7cff verified
raw
history blame
1.78 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.0,
"eval_steps": 500,
"global_step": 41,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_Claim": {
"f1-score": 0.3472626289341444,
"precision": 0.3978787878787879,
"recall": 0.3080713280150164,
"support": 4262.0
},
"eval_MajorClaim": {
"f1-score": 0.5334239746204397,
"precision": 0.5235765124555161,
"recall": 0.54364896073903,
"support": 2165.0
},
"eval_O": {
"f1-score": 0.8390533194223273,
"precision": 0.9157377442167086,
"recall": 0.7742197000405351,
"support": 9868.0
},
"eval_Premise": {
"f1-score": 0.8562600940945159,
"precision": 0.7896134170821731,
"recall": 0.9351944167497508,
"support": 13039.0
},
"eval_accuracy": 0.7610281584509443,
"eval_loss": 0.6209574341773987,
"eval_macro avg": {
"f1-score": 0.6440000042678569,
"precision": 0.6567016154082965,
"recall": 0.6402836013860831,
"support": 29334.0
},
"eval_runtime": 1.3904,
"eval_samples_per_second": 57.539,
"eval_steps_per_second": 7.192,
"eval_weighted avg": {
"f1-score": 0.7526914076678427,
"precision": 0.7554909643645776,
"recall": 0.7610281584509443,
"support": 29334.0
},
"step": 41
}
],
"logging_steps": 500,
"max_steps": 656,
"num_input_tokens_seen": 0,
"num_train_epochs": 16,
"save_steps": 500,
"total_flos": 143788732726800.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}