{ "epoch": 0.9999558635300348, "eval_accuracy": 0.5114566774944134, "eval_loss": 2.3657422065734863, "eval_runtime": 6.976, "eval_samples": 318, "eval_samples_per_second": 45.585, "eval_steps_per_second": 0.43, "perplexity": 10.651941825558275, "total_flos": 2.202782600225295e+20, "train_loss": 2.520355888510828, "train_runtime": 24592.232, "train_samples": 2900094, "train_samples_per_second": 117.927, "train_steps_per_second": 0.461 }