{ | |
"epoch": 0.9999558635300348, | |
"eval_accuracy": 0.515515162684974, | |
"eval_loss": 2.3370444774627686, | |
"eval_runtime": 7.4574, | |
"eval_samples": 318, | |
"eval_samples_per_second": 42.642, | |
"eval_steps_per_second": 0.402, | |
"perplexity": 10.350599880110575, | |
"total_flos": 2.234940544568441e+20, | |
"train_loss": 2.49364670185046, | |
"train_runtime": 28476.6031, | |
"train_samples": 2900094, | |
"train_samples_per_second": 101.841, | |
"train_steps_per_second": 0.398 | |
} |