{ "epoch": 4.0, "total_flos": 4.4722177046373335e+18, "train_loss": 0.03198626538376714, "train_runtime": 5538.163, "train_samples_per_second": 10.421, "train_steps_per_second": 0.651 }