{ "epoch": 0.9999558635300348, "eval_accuracy": 0.4982767756352662, "eval_loss": 2.483206033706665, "eval_runtime": 6.8799, "eval_samples": 318, "eval_samples_per_second": 46.221, "eval_steps_per_second": 0.436, "perplexity": 11.979609949761807, "total_flos": 1.9775705361382638e+20, "train_loss": 2.636019475715982, "train_runtime": 23008.8845, "train_samples": 2900094, "train_samples_per_second": 126.042, "train_steps_per_second": 0.492 }