***** train metrics ***** epoch = 1.0 num_input_tokens_seen = 417873560 total_flos = 73823561GF train_loss = 1.0007 train_runtime = 6 days, 5:47:01.98 train_samples_per_second = 1.571 train_steps_per_second = 0.031