ap-normistral-7b-align-scan / eval_results.json
hugodk-sch's picture
End of training
e33c89a verified
raw
history blame
565 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 98.7645034790039,
"eval_logits/rejected": 98.74665832519531,
"eval_logps/chosen": -32.56877517700195,
"eval_logps/rejected": -36.22236251831055,
"eval_loss": 0.7821906208992004,
"eval_rewards/accuracies": 0.52491694688797,
"eval_rewards/chosen": -0.10047715157270432,
"eval_rewards/margins": 0.1041894406080246,
"eval_rewards/rejected": -0.20466658473014832,
"eval_runtime": 103.6205,
"eval_samples": 343,
"eval_samples_per_second": 3.31,
"eval_steps_per_second": 0.415
}