epoch = 3.0 train_loss = 0.3734229371761423 train_runtime = 2422.1302 train_samples_per_second = 341.354 train_steps_per_second = 2.667