olivia-7b-dpo-lora-v2 / all_results.json
prd-nguyenvo's picture
Model save
04489e5
raw
history blame
741 Bytes
{
"epoch": 1.99,
"eval_logits/chosen": -2.5726864337921143,
"eval_logits/rejected": -2.556718587875366,
"eval_logps/chosen": -85.11767578125,
"eval_logps/rejected": -133.85464477539062,
"eval_loss": 0.12992651760578156,
"eval_rewards/accuracies": 0.9520547986030579,
"eval_rewards/chosen": -2.199751138687134,
"eval_rewards/margins": 4.689663887023926,
"eval_rewards/rejected": -6.889414310455322,
"eval_runtime": 288.3554,
"eval_samples": 876,
"eval_samples_per_second": 3.038,
"eval_steps_per_second": 3.038,
"train_loss": 0.20939183043777396,
"train_runtime": 5162.9911,
"train_samples": 3505,
"train_samples_per_second": 1.358,
"train_steps_per_second": 0.042
}