|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 26.314754098360655, |
|
"global_step": 3000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 9.99957013773138e-06, |
|
"loss": 0.029, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"learning_rate": 9.998254232827442e-06, |
|
"loss": 0.0249, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.94, |
|
"learning_rate": 9.996938327923503e-06, |
|
"loss": 0.0239, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 5.26, |
|
"learning_rate": 9.995622423019565e-06, |
|
"loss": 0.0223, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 6.58, |
|
"learning_rate": 9.994306518115625e-06, |
|
"loss": 0.0219, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 7.89, |
|
"learning_rate": 9.992990613211686e-06, |
|
"loss": 0.0215, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 8.77, |
|
"eval_loss": 0.21139128506183624, |
|
"eval_runtime": 432.0782, |
|
"eval_samples_per_second": 9.443, |
|
"eval_steps_per_second": 1.18, |
|
"eval_wer": 0.1666585139167441, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 9.21, |
|
"learning_rate": 9.991674708307746e-06, |
|
"loss": 0.0207, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 10.52, |
|
"learning_rate": 9.990358803403808e-06, |
|
"loss": 0.0209, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 11.84, |
|
"learning_rate": 9.989042898499869e-06, |
|
"loss": 0.0193, |
|
"step": 1350 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"learning_rate": 9.98772699359593e-06, |
|
"loss": 0.02, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 14.47, |
|
"learning_rate": 9.986411088691991e-06, |
|
"loss": 0.0191, |
|
"step": 1650 |
|
}, |
|
{ |
|
"epoch": 15.79, |
|
"learning_rate": 9.985095183788054e-06, |
|
"loss": 0.0189, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 17.1, |
|
"learning_rate": 9.983779278884114e-06, |
|
"loss": 0.0185, |
|
"step": 1950 |
|
}, |
|
{ |
|
"epoch": 17.54, |
|
"eval_loss": 0.2301694005727768, |
|
"eval_runtime": 231.0348, |
|
"eval_samples_per_second": 17.66, |
|
"eval_steps_per_second": 2.207, |
|
"eval_wer": 0.16558235092696766, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 18.42, |
|
"learning_rate": 9.982463373980174e-06, |
|
"loss": 0.0184, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 19.73, |
|
"learning_rate": 9.981147469076235e-06, |
|
"loss": 0.0186, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 21.05, |
|
"learning_rate": 9.979831564172297e-06, |
|
"loss": 0.0174, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 22.37, |
|
"learning_rate": 9.978515659268357e-06, |
|
"loss": 0.0175, |
|
"step": 2550 |
|
}, |
|
{ |
|
"epoch": 23.68, |
|
"learning_rate": 9.977199754364418e-06, |
|
"loss": 0.0169, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 9.97588384946048e-06, |
|
"loss": 0.0174, |
|
"step": 2850 |
|
}, |
|
{ |
|
"epoch": 26.31, |
|
"learning_rate": 9.974567944556542e-06, |
|
"loss": 0.0175, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 26.31, |
|
"eval_loss": 0.23709918558597565, |
|
"eval_runtime": 224.4917, |
|
"eval_samples_per_second": 18.174, |
|
"eval_steps_per_second": 2.272, |
|
"eval_wer": 0.16504426943207945, |
|
"step": 3000 |
|
} |
|
], |
|
"max_steps": 1140000, |
|
"num_train_epochs": 10000, |
|
"total_flos": 8.535940964167849e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|