{ "epoch": 8.0, "total_flos": 1.85717836136448e+16, "train_loss": 0.5860137939453125, "train_runtime": 10564.8969, "train_samples_per_second": 12.523, "train_steps_per_second": 0.392 }