zephyr-ds / eval_results.json
jikaixuan's picture
Training in progress, epoch 0
cf31064 verified
raw
history blame
578 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -2.4944536685943604,
"eval_logits/rejected": -2.4963433742523193,
"eval_logps/chosen": -269.25555419921875,
"eval_logps/rejected": -253.21238708496094,
"eval_loss": 0.6399702429771423,
"eval_rewards/accuracies": 0.6370000243186951,
"eval_rewards/chosen": 0.030110126361250877,
"eval_rewards/margins": 0.05743245780467987,
"eval_rewards/rejected": -0.027322327718138695,
"eval_runtime": 803.6977,
"eval_samples": 2000,
"eval_samples_per_second": 2.488,
"eval_steps_per_second": 0.311
}