{"final_train_loss": 0.8173830509185791, "best_val_loss": 1.4637625217437744, "total_train_time": 92.05195260047913, "avg_inference_tokens_per_second": 697.3658396135052} |
{"final_train_loss": 0.8173830509185791, "best_val_loss": 1.4637625217437744, "total_train_time": 92.05195260047913, "avg_inference_tokens_per_second": 697.3658396135052} |