{ "best_metric": null, "best_model_checkpoint": null, "epoch": 17.752260397830018, "global_step": 2450, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.72, "learning_rate": 1e-05, "loss": 0.0194, "step": 100 }, { "epoch": 1.45, "learning_rate": 9.99927530980506e-06, "loss": 0.0174, "step": 200 }, { "epoch": 2.17, "learning_rate": 9.998550619610118e-06, "loss": 0.0197, "step": 300 }, { "epoch": 2.54, "eval_loss": 0.2245764136314392, "eval_runtime": 322.1745, "eval_samples_per_second": 12.251, "eval_steps_per_second": 1.533, "eval_wer": 0.17368103101087395, "step": 350 }, { "epoch": 2.9, "learning_rate": 9.997825929415176e-06, "loss": 0.0205, "step": 400 }, { "epoch": 3.62, "learning_rate": 9.997108486122183e-06, "loss": 0.0199, "step": 500 }, { "epoch": 4.35, "learning_rate": 9.996383795927241e-06, "loss": 0.0198, "step": 600 }, { "epoch": 5.07, "learning_rate": 9.9956591057323e-06, "loss": 0.0193, "step": 700 }, { "epoch": 5.07, "eval_loss": 0.23122623562812805, "eval_runtime": 209.3421, "eval_samples_per_second": 18.854, "eval_steps_per_second": 2.36, "eval_wer": 0.17217076117599678, "step": 700 }, { "epoch": 5.8, "learning_rate": 9.994934415537358e-06, "loss": 0.0186, "step": 800 }, { "epoch": 6.52, "learning_rate": 9.994209725342417e-06, "loss": 0.0194, "step": 900 }, { "epoch": 7.25, "learning_rate": 9.993485035147475e-06, "loss": 0.0186, "step": 1000 }, { "epoch": 7.61, "eval_loss": 0.2398330122232437, "eval_runtime": 209.0, "eval_samples_per_second": 18.885, "eval_steps_per_second": 2.364, "eval_wer": 0.17232178815948448, "step": 1050 }, { "epoch": 7.97, "learning_rate": 9.992760344952534e-06, "loss": 0.0186, "step": 1100 }, { "epoch": 8.69, "learning_rate": 9.99203565475759e-06, "loss": 0.0191, "step": 1200 }, { "epoch": 9.42, "learning_rate": 9.991310964562651e-06, "loss": 0.0185, "step": 1300 }, { "epoch": 10.14, "learning_rate": 9.990586274367708e-06, "loss": 0.0171, "step": 1400 }, { "epoch": 10.14, "eval_loss": 0.24630184471607208, "eval_runtime": 212.2032, "eval_samples_per_second": 18.6, "eval_steps_per_second": 2.328, "eval_wer": 0.17020741039065646, "step": 1400 }, { "epoch": 10.87, "learning_rate": 9.989861584172766e-06, "loss": 0.0176, "step": 1500 }, { "epoch": 11.59, "learning_rate": 9.989136893977825e-06, "loss": 0.018, "step": 1600 }, { "epoch": 12.32, "learning_rate": 9.988412203782883e-06, "loss": 0.0172, "step": 1700 }, { "epoch": 12.68, "eval_loss": 0.24790118634700775, "eval_runtime": 215.9062, "eval_samples_per_second": 18.281, "eval_steps_per_second": 2.288, "eval_wer": 0.17081151832460734, "step": 1750 }, { "epoch": 13.04, "learning_rate": 9.987687513587942e-06, "loss": 0.0172, "step": 1800 }, { "epoch": 13.77, "learning_rate": 9.986962823393e-06, "loss": 0.0165, "step": 1900 }, { "epoch": 14.49, "learning_rate": 9.986238133198059e-06, "loss": 0.0176, "step": 2000 }, { "epoch": 15.22, "learning_rate": 9.985513443003117e-06, "loss": 0.0173, "step": 2100 }, { "epoch": 15.22, "eval_loss": 0.24780623614788055, "eval_runtime": 215.4375, "eval_samples_per_second": 18.321, "eval_steps_per_second": 2.293, "eval_wer": 0.17015706806282724, "step": 2100 }, { "epoch": 15.94, "learning_rate": 9.984788752808176e-06, "loss": 0.0168, "step": 2200 }, { "epoch": 16.67, "learning_rate": 9.984064062613234e-06, "loss": 0.0165, "step": 2300 }, { "epoch": 17.39, "learning_rate": 9.983339372418293e-06, "loss": 0.0169, "step": 2400 }, { "epoch": 17.75, "eval_loss": 0.24955050647258759, "eval_runtime": 224.6408, "eval_samples_per_second": 17.57, "eval_steps_per_second": 2.199, "eval_wer": 0.1689488521949255, "step": 2450 } ], "max_steps": 1380000, "num_train_epochs": 10000, "total_flos": 5.57531310441053e+19, "trial_name": null, "trial_params": null }