Llama-3-8B-Magpie-Align-v0.3 / all_results.json
flydust's picture
End of training
22e6a31 verified
raw
history blame
No virus
770 Bytes
{
"epoch": 0.9981298423724285,
"eval_logits/chosen": -1.1332677602767944,
"eval_logits/rejected": -1.1544803380966187,
"eval_logps/chosen": -715.691650390625,
"eval_logps/rejected": -871.3291625976562,
"eval_loss": 0.38531965017318726,
"eval_rewards/accuracies": 0.875,
"eval_rewards/chosen": -4.425616264343262,
"eval_rewards/margins": 1.6173373460769653,
"eval_rewards/rejected": -6.0429534912109375,
"eval_runtime": 126.4968,
"eval_samples": 1961,
"eval_samples_per_second": 15.502,
"eval_steps_per_second": 0.49,
"total_flos": 0.0,
"train_loss": 0.4754098514673286,
"train_runtime": 9903.4254,
"train_samples": 59875,
"train_samples_per_second": 6.046,
"train_steps_per_second": 0.047
}