hugodk-sch's picture
End of training
396c528 verified
raw
history blame
No virus
574 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -2.805530071258545,
"eval_logits/rejected": -2.802974224090576,
"eval_logps/chosen": -31.315858840942383,
"eval_logps/rejected": -34.838993072509766,
"eval_loss": 6.074533939361572,
"eval_rewards/accuracies": 0.5660299062728882,
"eval_rewards/chosen": -0.006680913269519806,
"eval_rewards/margins": 0.021486198529601097,
"eval_rewards/rejected": -0.0281671155244112,
"eval_runtime": 112.8101,
"eval_samples": 343,
"eval_samples_per_second": 3.041,
"eval_steps_per_second": 0.381
}