{
  "epoch": 1.0,
  "eval_loss": 1.3428778648376465,
  "eval_runtime": 2.0111,
  "eval_samples": 100,
  "eval_samples_per_second": 49.725,
  "eval_steps_per_second": 1.989,
  "perplexity": 3.830050026427415,
  "train_loss": 1.9416432221974707,
  "train_runtime": 74872.2082,
  "train_samples": 500000,
  "train_samples_per_second": 6.678,
  "train_steps_per_second": 0.052
}