{ "best_metric": null, "best_model_checkpoint": null, "epoch": 12.0, "eval_steps": 500, "global_step": 492, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_B": { "f1-score": 0.6054590570719602, "precision": 0.8472222222222222, "recall": 0.47104247104247104, "support": 1295.0 }, "eval_I": { "f1-score": 0.9281628372580799, "precision": 0.8894522863277146, "recall": 0.9703962123099925, "support": 20065.0 }, "eval_O": { "f1-score": 0.826809241932404, "precision": 0.8983402489626556, "recall": 0.7658295012380616, "support": 8481.0 }, "eval_accuracy": 0.8905867765825543, "eval_loss": 0.3152744174003601, "eval_macro avg": { "f1-score": 0.786810378754148, "precision": 0.8783382525041974, "recall": 0.735756061530175, "support": 29841.0 }, "eval_runtime": 1.3493, "eval_samples_per_second": 59.291, "eval_steps_per_second": 7.411, "eval_weighted avg": { "f1-score": 0.8853532384745914, "precision": 0.8901456571293072, "recall": 0.8905867765825543, "support": 29841.0 }, "step": 41 }, { "epoch": 2.0, "eval_B": { "f1-score": 0.8510791366906474, "precision": 0.7966329966329966, "recall": 0.9135135135135135, "support": 1295.0 }, "eval_I": { "f1-score": 0.9477035236938031, "precision": 0.9247806497510078, "recall": 0.9717916770495888, "support": 20065.0 }, "eval_O": { "f1-score": 0.8622397155916709, "precision": 0.9339843212763032, "recall": 0.8007310458672326, "support": 8481.0 }, "eval_accuracy": 0.9206460909486948, "eval_loss": 0.22530655562877655, "eval_macro avg": { "f1-score": 0.8870074586587071, "precision": 0.8851326558867693, "recall": 0.895345412143445, "support": 29841.0 }, "eval_runtime": 1.356, "eval_samples_per_second": 58.999, "eval_steps_per_second": 7.375, "eval_weighted avg": { "f1-score": 0.9192209950358067, "precision": 0.9218352098333846, "recall": 0.9206460909486948, "support": 29841.0 }, "step": 82 }, { "epoch": 3.0, "eval_B": { "f1-score": 0.8718693284936478, "precision": 0.8226027397260274, "recall": 0.9274131274131274, "support": 1295.0 }, "eval_I": { "f1-score": 0.95727385377943, "precision": 0.9520828198175992, "recall": 0.9625218041365562, "support": 20065.0 }, "eval_O": { "f1-score": 0.8947336671291549, "precision": 0.91600790513834, "recall": 0.8744251857092324, "support": 8481.0 }, "eval_accuracy": 0.9359605911330049, "eval_loss": 0.18091395497322083, "eval_macro avg": { "f1-score": 0.9079589498007442, "precision": 0.8968978215606556, "recall": 0.9214533724196388, "support": 29841.0 }, "eval_runtime": 1.3616, "eval_samples_per_second": 58.756, "eval_steps_per_second": 7.344, "eval_weighted avg": { "f1-score": 0.9357932672298482, "precision": 0.9362110978540797, "recall": 0.9359605911330049, "support": 29841.0 }, "step": 123 }, { "epoch": 4.0, "eval_B": { "f1-score": 0.8863383931877082, "precision": 0.8513513513513513, "recall": 0.9243243243243243, "support": 1295.0 }, "eval_I": { "f1-score": 0.9597514129823103, "precision": 0.942660770931462, "recall": 0.9774732120608024, "support": 20065.0 }, "eval_O": { "f1-score": 0.8954686530105526, "precision": 0.9454712282081531, "recall": 0.8504893290885509, "support": 8481.0 }, "eval_accuracy": 0.9390771086759827, "eval_loss": 0.19618020951747894, "eval_macro avg": { "f1-score": 0.913852819726857, "precision": 0.9131611168303221, "recall": 0.9174289551578925, "support": 29841.0 }, "eval_runtime": 1.355, "eval_samples_per_second": 59.041, "eval_steps_per_second": 7.38, "eval_weighted avg": { "f1-score": 0.9382959675228925, "precision": 0.9394969959174669, "recall": 0.9390771086759827, "support": 29841.0 }, "step": 164 }, { "epoch": 5.0, "eval_B": { "f1-score": 0.8794862108046846, "precision": 0.8609467455621301, "recall": 0.8988416988416988, "support": 1295.0 }, "eval_I": { "f1-score": 0.955187788105494, "precision": 0.9656717938270347, "recall": 0.9449289808123599, "support": 20065.0 }, "eval_O": { "f1-score": 0.8953622519612366, "precision": 0.8764539808018069, "recall": 0.9151043509020163, "support": 8481.0 }, "eval_accuracy": 0.9344525987734995, "eval_loss": 0.1936398446559906, "eval_macro avg": { "f1-score": 0.9100120836238051, "precision": 0.9010241733969906, "recall": 0.9196250101853582, "support": 29841.0 }, "eval_runtime": 1.3533, "eval_samples_per_second": 59.115, "eval_steps_per_second": 7.389, "eval_weighted avg": { "f1-score": 0.9348997979361299, "precision": 0.9357708116290517, "recall": 0.9344525987734995, "support": 29841.0 }, "step": 205 }, { "epoch": 6.0, "eval_B": { "f1-score": 0.8813928182807399, "precision": 0.8310533515731874, "recall": 0.9382239382239382, "support": 1295.0 }, "eval_I": { "f1-score": 0.9576389581878055, "precision": 0.958739197762126, "recall": 0.9565412409668577, "support": 20065.0 }, "eval_O": { "f1-score": 0.8994715278190131, "precision": 0.9059808612440191, "recall": 0.8930550642612899, "support": 8481.0 }, "eval_accuracy": 0.9377031600817667, "eval_loss": 0.19472843408584595, "eval_macro avg": { "f1-score": 0.9128344347625195, "precision": 0.8985911368597775, "recall": 0.9292734144840287, "support": 29841.0 }, "eval_runtime": 1.351, "eval_samples_per_second": 59.216, "eval_steps_per_second": 7.402, "eval_weighted avg": { "f1-score": 0.9377985799116962, "precision": 0.9382038060921168, "recall": 0.9377031600817667, "support": 29841.0 }, "step": 246 }, { "epoch": 7.0, "eval_B": { "f1-score": 0.8952959028831563, "precision": 0.8799403430275914, "recall": 0.9111969111969112, "support": 1295.0 }, "eval_I": { "f1-score": 0.9592318906147891, "precision": 0.9675979919882359, "recall": 0.9510092200348866, "support": 20065.0 }, "eval_O": { "f1-score": 0.9041714947856316, "precision": 0.8888256065611118, "recall": 0.9200565970993987, "support": 8481.0 }, "eval_accuracy": 0.940484568211521, "eval_loss": 0.20142190158367157, "eval_macro avg": { "f1-score": 0.919566429427859, "precision": 0.9121213138589797, "recall": 0.9274209094437321, "support": 29841.0 }, "eval_runtime": 1.3501, "eval_samples_per_second": 59.256, "eval_steps_per_second": 7.407, "eval_weighted avg": { "f1-score": 0.9408087707079646, "precision": 0.9414063343289258, "recall": 0.940484568211521, "support": 29841.0 }, "step": 287 }, { "epoch": 8.0, "eval_B": { "f1-score": 0.8921130952380952, "precision": 0.8607322325915291, "recall": 0.9258687258687258, "support": 1295.0 }, "eval_I": { "f1-score": 0.9613341204250295, "precision": 0.9490554125588849, "recall": 0.9739347121853975, "support": 20065.0 }, "eval_O": { "f1-score": 0.9013343126453666, "precision": 0.9371261295659921, "recall": 0.8681759226506308, "support": 8481.0 }, "eval_accuracy": 0.9417914949230924, "eval_loss": 0.21689558029174805, "eval_macro avg": { "f1-score": 0.9182605094361639, "precision": 0.9156379249054686, "recall": 0.9226597869015847, "support": 29841.0 }, "eval_runtime": 1.3576, "eval_samples_per_second": 58.928, "eval_steps_per_second": 7.366, "eval_weighted avg": { "f1-score": 0.9412778355352336, "precision": 0.9418321034499257, "recall": 0.9417914949230924, "support": 29841.0 }, "step": 328 }, { "epoch": 9.0, "eval_B": { "f1-score": 0.8985947588302315, "precision": 0.8841554559043349, "recall": 0.9135135135135135, "support": 1295.0 }, "eval_I": { "f1-score": 0.9622013609496847, "precision": 0.958962427602594, "recall": 0.9654622476949912, "support": 20065.0 }, "eval_O": { "f1-score": 0.9079425609247452, "precision": 0.9177306673090821, "recall": 0.8983610423299139, "support": 8481.0 }, "eval_accuracy": 0.9441372608156563, "eval_loss": 0.23563022911548615, "eval_macro avg": { "f1-score": 0.9229128935682205, "precision": 0.9202828502720036, "recall": 0.9257789345128061, "support": 29841.0 }, "eval_runtime": 1.3543, "eval_samples_per_second": 59.071, "eval_steps_per_second": 7.384, "eval_weighted avg": { "f1-score": 0.944020353853535, "precision": 0.9439977284504704, "recall": 0.9441372608156563, "support": 29841.0 }, "step": 369 }, { "epoch": 10.0, "eval_B": { "f1-score": 0.883806713389893, "precision": 0.846045197740113, "recall": 0.9250965250965251, "support": 1295.0 }, "eval_I": { "f1-score": 0.9612357047378584, "precision": 0.9549009000147544, "recall": 0.9676551208572141, "support": 20065.0 }, "eval_O": { "f1-score": 0.904241839135944, "precision": 0.9259762728620861, "recall": 0.8835043037377668, "support": 8481.0 }, "eval_accuracy": 0.9418920277470594, "eval_loss": 0.2491447478532791, "eval_macro avg": { "f1-score": 0.9164280857545651, "precision": 0.9089741235389845, "recall": 0.9254186498971686, "support": 29841.0 }, "eval_runtime": 1.3513, "eval_samples_per_second": 59.204, "eval_steps_per_second": 7.401, "eval_weighted avg": { "f1-score": 0.9416775291416837, "precision": 0.941956364063297, "recall": 0.9418920277470594, "support": 29841.0 }, "step": 410 }, { "epoch": 11.0, "eval_B": { "f1-score": 0.8962935230250841, "precision": 0.8699127906976745, "recall": 0.9243243243243243, "support": 1295.0 }, "eval_I": { "f1-score": 0.9609275419158742, "precision": 0.9454922579711543, "recall": 0.9768751557438325, "support": 20065.0 }, "eval_O": { "f1-score": 0.8992907801418439, "precision": 0.9427204551331781, "recall": 0.8596863577408325, "support": 8481.0 }, "eval_accuracy": 0.9412888308032573, "eval_loss": 0.2823159396648407, "eval_macro avg": { "f1-score": 0.9188372816942675, "precision": 0.9193751679340023, "recall": 0.9202952792696631, "support": 29841.0 }, "eval_runtime": 1.359, "eval_samples_per_second": 58.865, "eval_steps_per_second": 7.358, "eval_weighted avg": { "f1-score": 0.9406050851929385, "precision": 0.9414245970352596, "recall": 0.9412888308032573, "support": 29841.0 }, "step": 451 }, { "epoch": 12.0, "eval_B": { "f1-score": 0.896006028636021, "precision": 0.8749080206033848, "recall": 0.9181467181467181, "support": 1295.0 }, "eval_I": { "f1-score": 0.9606028094513335, "precision": 0.9618267212950934, "recall": 0.9593820084724645, "support": 20065.0 }, "eval_O": { "f1-score": 0.9053041477373296, "precision": 0.9059990552668871, "recall": 0.9046103053885155, "support": 8481.0 }, "eval_accuracy": 0.9420260715123487, "eval_loss": 0.2665592133998871, "eval_macro avg": { "f1-score": 0.9206376619415613, "precision": 0.9142445990551217, "recall": 0.9273796773358992, "support": 29841.0 }, "eval_runtime": 1.3553, "eval_samples_per_second": 59.028, "eval_steps_per_second": 7.379, "eval_weighted avg": { "f1-score": 0.9420832966618057, "precision": 0.9421881651816595, "recall": 0.9420260715123487, "support": 29841.0 }, "step": 492 } ], "logging_steps": 500, "max_steps": 656, "num_input_tokens_seen": 0, "num_train_epochs": 16, "save_steps": 500, "total_flos": 1725439832827200.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }