sfulay's picture
End of training
62601f5 verified
raw
history blame contribute delete
558 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 2.193073272705078,
"eval_logits/rejected": 3.0313031673431396,
"eval_logps/chosen": -469.1545104980469,
"eval_logps/rejected": -617.989501953125,
"eval_loss": 0.5419281721115112,
"eval_rewards/accuracies": 0.78125,
"eval_rewards/chosen": -2.0652458667755127,
"eval_rewards/margins": 1.4880279302597046,
"eval_rewards/rejected": -3.5532736778259277,
"eval_runtime": 103.7243,
"eval_samples": 2000,
"eval_samples_per_second": 19.282,
"eval_steps_per_second": 0.309
}