{"final_train_loss": 0.7964469194412231, "best_val_loss": 1.4783154726028442, "total_train_time": 99.80931115150452, "avg_inference_tokens_per_second": 602.1653151988776}