{ "epoch": 1.0, "eval_loss": 3.290411949157715, "eval_mem_cpu_alloc_delta": 544768, "eval_mem_cpu_peaked_delta": 73728, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 2645388800, "eval_runtime": 803.942, "eval_samples": 28999, "eval_samples_per_second": 36.071, "init_mem_cpu_alloc_delta": -36622336, "init_mem_cpu_peaked_delta": 1313382400, "init_mem_gpu_alloc_delta": 1444470784, "init_mem_gpu_peaked_delta": 0, "perplexity": 26.853923828930338, "train_mem_cpu_alloc_delta": 596549632, "train_mem_cpu_peaked_delta": 0, "train_mem_gpu_alloc_delta": 4257896960, "train_mem_gpu_peaked_delta": 2961890816, "train_runtime": 4429.0691, "train_samples": 29667, "train_samples_per_second": 1.675 }