{
"epoch": 0.9985974754558204,
"eval_accuracy": 0.8559900076029108,
"eval_loss": 0.65576171875,
"eval_runtime": 59.8715,
"eval_samples": 630,
"eval_samples_per_second": 10.523,
"eval_steps_per_second": 1.319,
"perplexity": 1.9266094931688238,
"total_flos": 1.3901992019623936e+17,
"train_loss": 0.5984635370947449,
"train_runtime": 5970.3946,
"train_samples": 8556,
"train_samples_per_second": 1.433,
"train_steps_per_second": 0.045
}