{ "all_params": 61096448, "epoch": 3.0, "memory_footprint": 244385792, "total_flos": 361674414489600.0, "train_loss": 2.1775987458951547, "train_runtime": 101.4394, "train_samples_per_second": 25.996, "train_steps_per_second": 3.253, "trainable_params": 589824, "trainable_params_percent": 0.9653981848502878 }