{ "epoch": 0.9999558635300348, "eval_accuracy": 0.4989978574884235, "eval_loss": 2.5016486644744873, "eval_runtime": 73.2986, "eval_samples": 318, "eval_samples_per_second": 4.338, "eval_steps_per_second": 0.041, "perplexity": 12.20259537139486, "total_flos": 2.234940544568441e+20, "train_loss": 2.6672301666211276, "train_runtime": 28535.6383, "train_samples": 2900094, "train_samples_per_second": 101.631, "train_steps_per_second": 0.397 }