{ "all_params": 223193728, "epoch": 5.0, "memory_footprint": 892774912, "total_flos": 4146070071306240.0, "train_loss": 1.9703198982044563, "train_runtime": 950.7032, "train_samples_per_second": 4.623, "train_steps_per_second": 4.623, "trainable_params": 290176, "trainable_params_percent": 0.13001082180947307 }