sfulay's picture
End of training
1ea383f verified
raw
history blame contribute delete
774 Bytes
{
"epoch": 0.9965156794425087,
"eval_logits/chosen": -2.396684169769287,
"eval_logits/rejected": -2.352323055267334,
"eval_logps/chosen": -293.2704772949219,
"eval_logps/rejected": -318.3273010253906,
"eval_loss": 0.6241225600242615,
"eval_rewards/accuracies": 0.6953125,
"eval_rewards/chosen": -0.3064056634902954,
"eval_rewards/margins": 0.2502462863922119,
"eval_rewards/rejected": -0.5566520094871521,
"eval_runtime": 104.8654,
"eval_samples": 2000,
"eval_samples_per_second": 19.072,
"eval_steps_per_second": 0.305,
"total_flos": 0.0,
"train_loss": 0.6510118654557875,
"train_runtime": 3809.3826,
"train_samples": 18340,
"train_samples_per_second": 4.814,
"train_steps_per_second": 0.038
}