{ | |
"epoch": 0.9999558635300348, | |
"eval_accuracy": 0.5067761728139086, | |
"eval_loss": 2.4069583415985107, | |
"eval_runtime": 36.3165, | |
"eval_samples": 318, | |
"eval_samples_per_second": 8.756, | |
"eval_steps_per_second": 0.083, | |
"perplexity": 11.100146890382385, | |
"total_flos": 2.202782600225295e+20, | |
"train_loss": 2.5603223798301933, | |
"train_runtime": 24610.1089, | |
"train_samples": 2900094, | |
"train_samples_per_second": 117.842, | |
"train_steps_per_second": 0.46 | |
} |