{ "best_metric": null, "best_model_checkpoint": null, "epoch": 7.407407407407407, "global_step": 600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.23, "learning_rate": 0.0001, "loss": 0.0625, "step": 100 }, { "epoch": 1.23, "eval_loss": 0.28051668405532837, "eval_runtime": 198.6071, "eval_samples_per_second": 16.374, "eval_steps_per_second": 2.049, "eval_wer": 0.2381097005406062, "step": 100 }, { "epoch": 2.47, "learning_rate": 9.987639060568604e-05, "loss": 0.047, "step": 200 }, { "epoch": 2.47, "eval_loss": 0.34423157572746277, "eval_runtime": 147.7154, "eval_samples_per_second": 22.015, "eval_steps_per_second": 2.755, "eval_wer": 0.2334325457085586, "step": 200 }, { "epoch": 3.7, "learning_rate": 9.975278121137207e-05, "loss": 0.0409, "step": 300 }, { "epoch": 3.7, "eval_loss": 0.3597787916660309, "eval_runtime": 156.092, "eval_samples_per_second": 20.834, "eval_steps_per_second": 2.607, "eval_wer": 0.23124582396889995, "step": 300 }, { "epoch": 4.94, "learning_rate": 9.96291718170581e-05, "loss": 0.0413, "step": 400 }, { "epoch": 4.94, "eval_loss": 0.35860675573349, "eval_runtime": 151.5312, "eval_samples_per_second": 21.461, "eval_steps_per_second": 2.686, "eval_wer": 0.2421794326671931, "step": 400 }, { "epoch": 6.17, "learning_rate": 9.950556242274414e-05, "loss": 0.0388, "step": 500 }, { "epoch": 6.17, "eval_loss": 0.3748931586742401, "eval_runtime": 154.1563, "eval_samples_per_second": 21.095, "eval_steps_per_second": 2.64, "eval_wer": 0.23914231913988945, "step": 500 }, { "epoch": 7.41, "learning_rate": 9.938195302843017e-05, "loss": 0.0383, "step": 600 }, { "epoch": 7.41, "eval_loss": 0.36109668016433716, "eval_runtime": 163.2656, "eval_samples_per_second": 19.918, "eval_steps_per_second": 2.493, "eval_wer": 0.2352548138249408, "step": 600 } ], "max_steps": 81000, "num_train_epochs": 1000, "total_flos": 1.9144703855961313e+19, "trial_name": null, "trial_params": null }