{ "best_metric": null, "best_model_checkpoint": null, "epoch": 12.0, "eval_steps": 500, "global_step": 492, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_B": { "f1-score": 0.6659475008989573, "precision": 0.6905294556301268, "recall": 0.6430555555555556, "support": 1440.0 }, "eval_I": { "f1-score": 0.9167863956473609, "precision": 0.9325347388596071, "recall": 0.9015611247510076, "support": 21587.0 }, "eval_O": { "f1-score": 0.8443157797996509, "precision": 0.8138010452653025, "recall": 0.8772080588179128, "support": 10473.0 }, "eval_accuracy": 0.8828358208955224, "eval_loss": 0.31183817982673645, "eval_macro avg": { "f1-score": 0.8090165587819897, "precision": 0.8122884132516788, "recall": 0.8072749130414919, "support": 33500.0 }, "eval_runtime": 1.3725, "eval_samples_per_second": 59.018, "eval_steps_per_second": 8.015, "eval_weighted avg": { "f1-score": 0.8833478055515172, "precision": 0.8850127812218876, "recall": 0.8828358208955224, "support": 33500.0 }, "step": 41 }, { "epoch": 2.0, "eval_B": { "f1-score": 0.8377561303325496, "precision": 0.8113207547169812, "recall": 0.8659722222222223, "support": 1440.0 }, "eval_I": { "f1-score": 0.9473755107538951, "precision": 0.9191461555216729, "recall": 0.9773938018251725, "support": 21587.0 }, "eval_O": { "f1-score": 0.8803449514911966, "precision": 0.9519316163410302, "recall": 0.8187720805881791, "support": 10473.0 }, "eval_accuracy": 0.9230149253731343, "eval_loss": 0.22658132016658783, "eval_macro avg": { "f1-score": 0.8884921975258804, "precision": 0.8941328421932281, "recall": 0.8873793682118579, "support": 33500.0 }, "eval_runtime": 1.3801, "eval_samples_per_second": 58.69, "eval_steps_per_second": 7.97, "eval_weighted avg": { "f1-score": 0.9217079598594182, "precision": 0.9247608884769675, "recall": 0.9230149253731343, "support": 33500.0 }, "step": 82 }, { "epoch": 3.0, "eval_B": { "f1-score": 0.8710106382978723, "precision": 0.8354591836734694, "recall": 0.9097222222222222, "support": 1440.0 }, "eval_I": { "f1-score": 0.9543258273315707, "precision": 0.9392974112791063, "recall": 0.9698429610413675, "support": 21587.0 }, "eval_O": { "f1-score": 0.8996818452972758, "precision": 0.9384009125790729, "recall": 0.8640313186288552, "support": 10473.0 }, "eval_accuracy": 0.934179104477612, "eval_loss": 0.20443089306354523, "eval_macro avg": { "f1-score": 0.908339436975573, "precision": 0.9043858358438829, "recall": 0.9145321672974815, "support": 33500.0 }, "eval_runtime": 1.3812, "eval_samples_per_second": 58.646, "eval_steps_per_second": 7.964, "eval_weighted avg": { "f1-score": 0.9336613408822066, "precision": 0.9345536477376863, "recall": 0.934179104477612, "support": 33500.0 }, "step": 123 }, { "epoch": 4.0, "eval_B": { "f1-score": 0.8771342484097756, "precision": 0.8468002585649644, "recall": 0.9097222222222222, "support": 1440.0 }, "eval_I": { "f1-score": 0.959998160834981, "precision": 0.952900369677331, "recall": 0.9672024829758651, "support": 21587.0 }, "eval_O": { "f1-score": 0.9145503290275409, "precision": 0.9341764588727345, "recall": 0.8957318819822401, "support": 10473.0 }, "eval_accuracy": 0.9423880597014925, "eval_loss": 0.18545031547546387, "eval_macro avg": { "f1-score": 0.9172275794240993, "precision": 0.9112923623716767, "recall": 0.9242188623934425, "support": 33500.0 }, "eval_runtime": 1.377, "eval_samples_per_second": 58.824, "eval_steps_per_second": 7.988, "eval_weighted avg": { "f1-score": 0.9422280361659775, "precision": 0.9424860509352908, "recall": 0.9423880597014925, "support": 33500.0 }, "step": 164 }, { "epoch": 5.0, "eval_B": { "f1-score": 0.8835341365461846, "precision": 0.8527131782945736, "recall": 0.9166666666666666, "support": 1440.0 }, "eval_I": { "f1-score": 0.9602170394181884, "precision": 0.9453672113485365, "recall": 0.9755408347616621, "support": 21587.0 }, "eval_O": { "f1-score": 0.9125018611345476, "precision": 0.9500826787928897, "recall": 0.877780960565263, "support": 10473.0 }, "eval_accuracy": 0.9424477611940298, "eval_loss": 0.19699566066265106, "eval_macro avg": { "f1-score": 0.9187510123663069, "precision": 0.9160543561453333, "recall": 0.9233294873311971, "support": 33500.0 }, "eval_runtime": 1.3779, "eval_samples_per_second": 58.784, "eval_steps_per_second": 7.983, "eval_weighted avg": { "f1-score": 0.9420037724838524, "precision": 0.9428586526305366, "recall": 0.9424477611940298, "support": 33500.0 }, "step": 205 }, { "epoch": 6.0, "eval_B": { "f1-score": 0.882471457353929, "precision": 0.8543563068920677, "recall": 0.9125, "support": 1440.0 }, "eval_I": { "f1-score": 0.9563333022648896, "precision": 0.9621173050775939, "recall": 0.9506184277574466, "support": 21587.0 }, "eval_O": { "f1-score": 0.9094096465460059, "precision": 0.9025674786043449, "recall": 0.9163563448868519, "support": 10473.0 }, "eval_accuracy": 0.9382686567164179, "eval_loss": 0.22578871250152588, "eval_macro avg": { "f1-score": 0.9160714687216082, "precision": 0.9063470301913354, "recall": 0.9264915908814327, "support": 33500.0 }, "eval_runtime": 1.3827, "eval_samples_per_second": 58.582, "eval_steps_per_second": 7.956, "eval_weighted avg": { "f1-score": 0.9384887499360641, "precision": 0.9388683149271014, "recall": 0.9382686567164179, "support": 33500.0 }, "step": 246 }, { "epoch": 7.0, "eval_B": { "f1-score": 0.8892651540805959, "precision": 0.8678122934567085, "recall": 0.9118055555555555, "support": 1440.0 }, "eval_I": { "f1-score": 0.9597268994787103, "precision": 0.9557587173243901, "recall": 0.963728169731783, "support": 21587.0 }, "eval_O": { "f1-score": 0.914125549702798, "precision": 0.925440313111546, "recall": 0.903084121073236, "support": 10473.0 }, "eval_accuracy": 0.9425373134328359, "eval_loss": 0.22205175459384918, "eval_macro avg": { "f1-score": 0.9210392010873681, "precision": 0.9163371079642149, "recall": 0.9262059487868582, "support": 33500.0 }, "eval_runtime": 1.3808, "eval_samples_per_second": 58.663, "eval_steps_per_second": 7.967, "eval_weighted avg": { "f1-score": 0.9424418890435934, "precision": 0.9424999860500445, "recall": 0.9425373134328359, "support": 33500.0 }, "step": 287 }, { "epoch": 8.0, "eval_B": { "f1-score": 0.8742837883383889, "precision": 0.8493778650949574, "recall": 0.9006944444444445, "support": 1440.0 }, "eval_I": { "f1-score": 0.954344074989507, "precision": 0.9607962815155641, "recall": 0.9479779496919443, "support": 21587.0 }, "eval_O": { "f1-score": 0.9060386816096845, "precision": 0.8975079632752483, "recall": 0.9147331232693593, "support": 10473.0 }, "eval_accuracy": 0.9355522388059702, "eval_loss": 0.2697383165359497, "eval_macro avg": { "f1-score": 0.9115555149791934, "precision": 0.9025607032952566, "recall": 0.9211351724685827, "support": 33500.0 }, "eval_runtime": 1.3839, "eval_samples_per_second": 58.529, "eval_steps_per_second": 7.948, "eval_weighted avg": { "f1-score": 0.9358011138657909, "precision": 0.9362213240058178, "recall": 0.9355522388059702, "support": 33500.0 }, "step": 328 }, { "epoch": 9.0, "eval_B": { "f1-score": 0.8867732063923836, "precision": 0.8687541638907396, "recall": 0.9055555555555556, "support": 1440.0 }, "eval_I": { "f1-score": 0.9593785402168635, "precision": 0.9576294655220161, "recall": 0.9611340158428684, "support": 21587.0 }, "eval_O": { "f1-score": 0.9133903681630298, "precision": 0.9195780509048679, "recall": 0.907285400553805, "support": 10473.0 }, "eval_accuracy": 0.941910447761194, "eval_loss": 0.236963152885437, "eval_macro avg": { "f1-score": 0.9198473715907589, "precision": 0.9153205601058745, "recall": 0.9246583239840763, "support": 33500.0 }, "eval_runtime": 1.3821, "eval_samples_per_second": 58.608, "eval_steps_per_second": 7.959, "eval_weighted avg": { "f1-score": 0.9418804564369516, "precision": 0.9419132595627793, "recall": 0.941910447761194, "support": 33500.0 }, "step": 369 }, { "epoch": 10.0, "eval_B": { "f1-score": 0.8820989704417137, "precision": 0.8453214513049013, "recall": 0.9222222222222223, "support": 1440.0 }, "eval_I": { "f1-score": 0.9598799630655587, "precision": 0.956655776929094, "recall": 0.9631259554361421, "support": 21587.0 }, "eval_O": { "f1-score": 0.914896705210702, "precision": 0.9273244409572381, "recall": 0.9027976701995608, "support": 10473.0 }, "eval_accuracy": 0.9425074626865672, "eval_loss": 0.27435505390167236, "eval_macro avg": { "f1-score": 0.9189585462393248, "precision": 0.9097672230637445, "recall": 0.9293819492859751, "support": 33500.0 }, "eval_runtime": 1.375, "eval_samples_per_second": 58.909, "eval_steps_per_second": 8.0, "eval_weighted avg": { "f1-score": 0.9424735663822079, "precision": 0.9427002990027631, "recall": 0.9425074626865672, "support": 33500.0 }, "step": 410 }, { "epoch": 11.0, "eval_B": { "f1-score": 0.8886590830748018, "precision": 0.8822724161533196, "recall": 0.8951388888888889, "support": 1440.0 }, "eval_I": { "f1-score": 0.9554279336882978, "precision": 0.9591074596209505, "recall": 0.9517765321721406, "support": 21587.0 }, "eval_O": { "f1-score": 0.9066856330014225, "precision": 0.9005368748233964, "recall": 0.91291893440275, "support": 10473.0 }, "eval_accuracy": 0.9371940298507463, "eval_loss": 0.29653802514076233, "eval_macro avg": { "f1-score": 0.916924216588174, "precision": 0.9139722501992221, "recall": 0.9199447851545933, "support": 33500.0 }, "eval_runtime": 1.3782, "eval_samples_per_second": 58.771, "eval_steps_per_second": 7.981, "eval_weighted avg": { "f1-score": 0.9373197169725641, "precision": 0.9374939611977214, "recall": 0.9371940298507463, "support": 33500.0 }, "step": 451 }, { "epoch": 12.0, "eval_B": { "f1-score": 0.8851788756388416, "precision": 0.8688963210702341, "recall": 0.9020833333333333, "support": 1440.0 }, "eval_I": { "f1-score": 0.956586582154592, "precision": 0.9624402138235019, "recall": 0.9508037244637977, "support": 21587.0 }, "eval_O": { "f1-score": 0.9096066565809379, "precision": 0.9008334113681056, "recall": 0.9185524682516948, "support": 10473.0 }, "eval_accuracy": 0.9386268656716418, "eval_loss": 0.3317875564098358, "eval_macro avg": { "f1-score": 0.9171240381247904, "precision": 0.9107233154206137, "recall": 0.9238131753496086, "support": 33500.0 }, "eval_runtime": 1.3866, "eval_samples_per_second": 58.418, "eval_steps_per_second": 7.933, "eval_weighted avg": { "f1-score": 0.9388299296795006, "precision": 0.9391592810569325, "recall": 0.9386268656716418, "support": 33500.0 }, "step": 492 } ], "logging_steps": 500, "max_steps": 656, "num_input_tokens_seen": 0, "num_train_epochs": 16, "save_steps": 500, "total_flos": 1720081324029600.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }