|
{ |
|
"best_metric": 0.7780054113531673, |
|
"best_model_checkpoint": "bart-base/checkpoint-10288", |
|
"epoch": 27.0, |
|
"eval_steps": 500, |
|
"global_step": 17361, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.78, |
|
"learning_rate": 4.871176775531364e-05, |
|
"loss": 1.2028, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7598760650658405, |
|
"eval_f1_macro": 0.6063644681337579, |
|
"eval_f1_micro": 0.7598760650658405, |
|
"eval_f1_weighted": 0.7489266744747745, |
|
"eval_loss": 0.8429557681083679, |
|
"eval_macro_fpr": 0.023226157303183535, |
|
"eval_macro_sensitivity": 0.6366904609623596, |
|
"eval_macro_specificity": 0.981694425945952, |
|
"eval_precision": 0.7600880594489849, |
|
"eval_precision_macro": 0.6003620126022547, |
|
"eval_recall": 0.7598760650658405, |
|
"eval_recall_macro": 0.6366904609623596, |
|
"eval_runtime": 43.5934, |
|
"eval_samples_per_second": 29.615, |
|
"eval_steps_per_second": 3.716, |
|
"eval_weighted_fpr": 0.02207348333808032, |
|
"eval_weighted_sensitivity": 0.7598760650658405, |
|
"eval_weighted_specificity": 0.9655403241234398, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 1.56, |
|
"learning_rate": 4.741575946086055e-05, |
|
"loss": 0.715, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7931835786212239, |
|
"eval_f1_macro": 0.7213629796675549, |
|
"eval_f1_micro": 0.793183578621224, |
|
"eval_f1_weighted": 0.7853477061503886, |
|
"eval_loss": 0.7331996560096741, |
|
"eval_macro_fpr": 0.018982515099395962, |
|
"eval_macro_sensitivity": 0.7320748785168393, |
|
"eval_macro_specificity": 0.9845140063777027, |
|
"eval_precision": 0.8019650926098448, |
|
"eval_precision_macro": 0.7386000214414028, |
|
"eval_recall": 0.7931835786212239, |
|
"eval_recall_macro": 0.7320748785168393, |
|
"eval_runtime": 77.2393, |
|
"eval_samples_per_second": 16.714, |
|
"eval_steps_per_second": 2.097, |
|
"eval_weighted_fpr": 0.018283914264192288, |
|
"eval_weighted_sensitivity": 0.7931835786212239, |
|
"eval_weighted_specificity": 0.9745265170443169, |
|
"step": 1286 |
|
}, |
|
{ |
|
"epoch": 2.33, |
|
"learning_rate": 4.611975116640747e-05, |
|
"loss": 0.578, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7939581719597212, |
|
"eval_f1_macro": 0.6998313050068915, |
|
"eval_f1_micro": 0.7939581719597211, |
|
"eval_f1_weighted": 0.79006368267302, |
|
"eval_loss": 0.8045273423194885, |
|
"eval_macro_fpr": 0.018545878882531782, |
|
"eval_macro_sensitivity": 0.7068834234702027, |
|
"eval_macro_specificity": 0.9847671550097226, |
|
"eval_precision": 0.8075005963568469, |
|
"eval_precision_macro": 0.7230632440844518, |
|
"eval_recall": 0.7939581719597212, |
|
"eval_recall_macro": 0.7068834234702027, |
|
"eval_runtime": 86.4099, |
|
"eval_samples_per_second": 14.94, |
|
"eval_steps_per_second": 1.875, |
|
"eval_weighted_fpr": 0.018199233716475097, |
|
"eval_weighted_sensitivity": 0.7939581719597212, |
|
"eval_weighted_specificity": 0.977549153186118, |
|
"step": 1929 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 4.482633488854329e-05, |
|
"loss": 0.481, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"learning_rate": 4.3530326594090203e-05, |
|
"loss": 0.3938, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8156467854376452, |
|
"eval_f1_macro": 0.7369315728111729, |
|
"eval_f1_micro": 0.8156467854376452, |
|
"eval_f1_weighted": 0.8105168035589256, |
|
"eval_loss": 0.8291025161743164, |
|
"eval_macro_fpr": 0.016938074954137138, |
|
"eval_macro_sensitivity": 0.7217605983180461, |
|
"eval_macro_specificity": 0.9857842035419169, |
|
"eval_precision": 0.8171220006778526, |
|
"eval_precision_macro": 0.7937034642937142, |
|
"eval_recall": 0.8156467854376452, |
|
"eval_recall_macro": 0.7217605983180461, |
|
"eval_runtime": 84.4366, |
|
"eval_samples_per_second": 15.29, |
|
"eval_steps_per_second": 1.919, |
|
"eval_weighted_fpr": 0.01588785046728972, |
|
"eval_weighted_sensitivity": 0.8156467854376452, |
|
"eval_weighted_specificity": 0.9711162676911109, |
|
"step": 2572 |
|
}, |
|
{ |
|
"epoch": 4.67, |
|
"learning_rate": 4.2236910316226025e-05, |
|
"loss": 0.3238, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7939581719597212, |
|
"eval_f1_macro": 0.7360579650857649, |
|
"eval_f1_micro": 0.7939581719597211, |
|
"eval_f1_weighted": 0.7995200606905476, |
|
"eval_loss": 0.8888681530952454, |
|
"eval_macro_fpr": 0.018767728188278533, |
|
"eval_macro_sensitivity": 0.7515467286591376, |
|
"eval_macro_specificity": 0.9846803211687324, |
|
"eval_precision": 0.8146370555192632, |
|
"eval_precision_macro": 0.7464262358644205, |
|
"eval_recall": 0.7939581719597212, |
|
"eval_recall_macro": 0.7515467286591376, |
|
"eval_runtime": 82.179, |
|
"eval_samples_per_second": 15.71, |
|
"eval_steps_per_second": 1.971, |
|
"eval_weighted_fpr": 0.018199233716475097, |
|
"eval_weighted_sensitivity": 0.7939581719597212, |
|
"eval_weighted_specificity": 0.9762466455712672, |
|
"step": 3215 |
|
}, |
|
{ |
|
"epoch": 5.44, |
|
"learning_rate": 4.094090202177294e-05, |
|
"loss": 0.246, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7955073586367157, |
|
"eval_f1_macro": 0.7362210043644567, |
|
"eval_f1_micro": 0.7955073586367158, |
|
"eval_f1_weighted": 0.7945977979999089, |
|
"eval_loss": 1.1628626585006714, |
|
"eval_macro_fpr": 0.01863187379355594, |
|
"eval_macro_sensitivity": 0.7599986341032186, |
|
"eval_macro_specificity": 0.9846932142915057, |
|
"eval_precision": 0.8066758597712774, |
|
"eval_precision_macro": 0.7483163388808308, |
|
"eval_recall": 0.7955073586367157, |
|
"eval_recall_macro": 0.7599986341032186, |
|
"eval_runtime": 82.1621, |
|
"eval_samples_per_second": 15.713, |
|
"eval_steps_per_second": 1.972, |
|
"eval_weighted_fpr": 0.018030323726266905, |
|
"eval_weighted_sensitivity": 0.7955073586367157, |
|
"eval_weighted_specificity": 0.9748908557358684, |
|
"step": 3858 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 3.964489372731986e-05, |
|
"loss": 0.228, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.834888543286677e-05, |
|
"loss": 0.1791, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8179705654531371, |
|
"eval_f1_macro": 0.7736489492761546, |
|
"eval_f1_micro": 0.817970565453137, |
|
"eval_f1_weighted": 0.8146592022169725, |
|
"eval_loss": 1.1354283094406128, |
|
"eval_macro_fpr": 0.016454731140779742, |
|
"eval_macro_sensitivity": 0.7696557438486226, |
|
"eval_macro_specificity": 0.9861772746118799, |
|
"eval_precision": 0.8150792023791334, |
|
"eval_precision_macro": 0.7832166669456337, |
|
"eval_recall": 0.8179705654531371, |
|
"eval_recall_macro": 0.7696557438486226, |
|
"eval_runtime": 85.4548, |
|
"eval_samples_per_second": 15.107, |
|
"eval_steps_per_second": 1.896, |
|
"eval_weighted_fpr": 0.01564684732671949, |
|
"eval_weighted_sensitivity": 0.8179705654531371, |
|
"eval_weighted_specificity": 0.9746885537250626, |
|
"step": 4501 |
|
}, |
|
{ |
|
"epoch": 7.78, |
|
"learning_rate": 3.705546915500259e-05, |
|
"loss": 0.1305, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8109992254066615, |
|
"eval_f1_macro": 0.7368975448573482, |
|
"eval_f1_micro": 0.8109992254066615, |
|
"eval_f1_weighted": 0.808822910649843, |
|
"eval_loss": 1.282464861869812, |
|
"eval_macro_fpr": 0.016943107063520774, |
|
"eval_macro_sensitivity": 0.7488577570944955, |
|
"eval_macro_specificity": 0.9858309939135591, |
|
"eval_precision": 0.8147632227505013, |
|
"eval_precision_macro": 0.7422132710401315, |
|
"eval_recall": 0.8109992254066615, |
|
"eval_recall_macro": 0.7488577570944955, |
|
"eval_runtime": 87.6049, |
|
"eval_samples_per_second": 14.737, |
|
"eval_steps_per_second": 1.849, |
|
"eval_weighted_fpr": 0.016373641121997046, |
|
"eval_weighted_sensitivity": 0.8109992254066615, |
|
"eval_weighted_specificity": 0.9764656832967246, |
|
"step": 5144 |
|
}, |
|
{ |
|
"epoch": 8.55, |
|
"learning_rate": 3.575946086054951e-05, |
|
"loss": 0.0924, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8040278853601859, |
|
"eval_f1_macro": 0.7559721746710123, |
|
"eval_f1_micro": 0.8040278853601859, |
|
"eval_f1_weighted": 0.80145679310201, |
|
"eval_loss": 1.421708583831787, |
|
"eval_macro_fpr": 0.017802568540250287, |
|
"eval_macro_sensitivity": 0.7809236600744539, |
|
"eval_macro_specificity": 0.9853492039682624, |
|
"eval_precision": 0.8113877598541575, |
|
"eval_precision_macro": 0.7464644897074477, |
|
"eval_recall": 0.8040278853601859, |
|
"eval_recall_macro": 0.7809236600744539, |
|
"eval_runtime": 89.5999, |
|
"eval_samples_per_second": 14.408, |
|
"eval_steps_per_second": 1.808, |
|
"eval_weighted_fpr": 0.017111937774771727, |
|
"eval_weighted_sensitivity": 0.8040278853601859, |
|
"eval_weighted_specificity": 0.9762101741637506, |
|
"step": 5787 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 3.446345256609643e-05, |
|
"loss": 0.0953, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8024786986831913, |
|
"eval_f1_macro": 0.7661426626929498, |
|
"eval_f1_micro": 0.8024786986831914, |
|
"eval_f1_weighted": 0.8001228885030943, |
|
"eval_loss": 1.5552372932434082, |
|
"eval_macro_fpr": 0.018250858387380567, |
|
"eval_macro_sensitivity": 0.7822186507003115, |
|
"eval_macro_specificity": 0.9849087494473102, |
|
"eval_precision": 0.8055922813865947, |
|
"eval_precision_macro": 0.7702182213697708, |
|
"eval_recall": 0.8024786986831913, |
|
"eval_recall_macro": 0.7822186507003115, |
|
"eval_runtime": 85.2534, |
|
"eval_samples_per_second": 15.143, |
|
"eval_steps_per_second": 1.9, |
|
"eval_weighted_fpr": 0.017277593332881633, |
|
"eval_weighted_sensitivity": 0.8024786986831913, |
|
"eval_weighted_specificity": 0.9711525430264618, |
|
"step": 6430 |
|
}, |
|
{ |
|
"epoch": 10.11, |
|
"learning_rate": 3.316744427164334e-05, |
|
"loss": 0.0668, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 10.89, |
|
"learning_rate": 3.1871435977190256e-05, |
|
"loss": 0.0617, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.8040278853601859, |
|
"eval_f1_macro": 0.7422420279485343, |
|
"eval_f1_micro": 0.8040278853601859, |
|
"eval_f1_weighted": 0.8069943234338898, |
|
"eval_loss": 1.5223894119262695, |
|
"eval_macro_fpr": 0.017602619829831197, |
|
"eval_macro_sensitivity": 0.7512050029477755, |
|
"eval_macro_specificity": 0.9853474796083734, |
|
"eval_precision": 0.8144253833246468, |
|
"eval_precision_macro": 0.745702567690635, |
|
"eval_recall": 0.8040278853601859, |
|
"eval_recall_macro": 0.7512050029477755, |
|
"eval_runtime": 85.7004, |
|
"eval_samples_per_second": 15.064, |
|
"eval_steps_per_second": 1.89, |
|
"eval_weighted_fpr": 0.017111937774771727, |
|
"eval_weighted_sensitivity": 0.8040278853601859, |
|
"eval_weighted_specificity": 0.9761843087654142, |
|
"step": 7073 |
|
}, |
|
{ |
|
"epoch": 11.66, |
|
"learning_rate": 3.057542768273717e-05, |
|
"loss": 0.0582, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.7970565453137103, |
|
"eval_f1_macro": 0.7465072775190384, |
|
"eval_f1_micro": 0.7970565453137104, |
|
"eval_f1_weighted": 0.8021748784206515, |
|
"eval_loss": 1.6427809000015259, |
|
"eval_macro_fpr": 0.01832354936918133, |
|
"eval_macro_sensitivity": 0.7654834054509102, |
|
"eval_macro_specificity": 0.9849466228972559, |
|
"eval_precision": 0.8148454054398186, |
|
"eval_precision_macro": 0.7470312881962948, |
|
"eval_recall": 0.7970565453137103, |
|
"eval_recall_macro": 0.7654834054509102, |
|
"eval_runtime": 95.4565, |
|
"eval_samples_per_second": 13.524, |
|
"eval_steps_per_second": 1.697, |
|
"eval_weighted_fpr": 0.017862012544314153, |
|
"eval_weighted_sensitivity": 0.7970565453137103, |
|
"eval_weighted_specificity": 0.9771427981451267, |
|
"step": 7716 |
|
}, |
|
{ |
|
"epoch": 12.44, |
|
"learning_rate": 2.9279419388284086e-05, |
|
"loss": 0.0511, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.8195197521301317, |
|
"eval_f1_macro": 0.7586168211948496, |
|
"eval_f1_micro": 0.8195197521301317, |
|
"eval_f1_weighted": 0.8186828900418365, |
|
"eval_loss": 1.4951962232589722, |
|
"eval_macro_fpr": 0.016182326988526896, |
|
"eval_macro_sensitivity": 0.7580273333502953, |
|
"eval_macro_specificity": 0.9863597979839632, |
|
"eval_precision": 0.8208277188287908, |
|
"eval_precision_macro": 0.7645206618886077, |
|
"eval_recall": 0.8195197521301317, |
|
"eval_recall_macro": 0.7580273333502953, |
|
"eval_runtime": 85.8279, |
|
"eval_samples_per_second": 15.042, |
|
"eval_steps_per_second": 1.887, |
|
"eval_weighted_fpr": 0.01548687271518777, |
|
"eval_weighted_sensitivity": 0.8195197521301317, |
|
"eval_weighted_specificity": 0.9758772176293167, |
|
"step": 8359 |
|
}, |
|
{ |
|
"epoch": 13.22, |
|
"learning_rate": 2.7983411093831004e-05, |
|
"loss": 0.0403, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 2.668740279937792e-05, |
|
"loss": 0.0476, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.7970565453137103, |
|
"eval_f1_macro": 0.7416650578915932, |
|
"eval_f1_micro": 0.7970565453137104, |
|
"eval_f1_weighted": 0.7913296065268454, |
|
"eval_loss": 1.7132102251052856, |
|
"eval_macro_fpr": 0.018853564171086353, |
|
"eval_macro_sensitivity": 0.7328360987022614, |
|
"eval_macro_specificity": 0.9845211676049321, |
|
"eval_precision": 0.795801987953062, |
|
"eval_precision_macro": 0.763738385548772, |
|
"eval_recall": 0.7970565453137103, |
|
"eval_recall_macro": 0.7328360987022614, |
|
"eval_runtime": 90.1914, |
|
"eval_samples_per_second": 14.314, |
|
"eval_steps_per_second": 1.796, |
|
"eval_weighted_fpr": 0.017862012544314153, |
|
"eval_weighted_sensitivity": 0.7970565453137103, |
|
"eval_weighted_specificity": 0.9707609687602743, |
|
"step": 9002 |
|
}, |
|
{ |
|
"epoch": 14.77, |
|
"learning_rate": 2.5391394504924833e-05, |
|
"loss": 0.0375, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.8001549186676995, |
|
"eval_f1_macro": 0.7437118125777374, |
|
"eval_f1_micro": 0.8001549186676995, |
|
"eval_f1_weighted": 0.8017305518379161, |
|
"eval_loss": 1.7058144807815552, |
|
"eval_macro_fpr": 0.018188016275518495, |
|
"eval_macro_sensitivity": 0.7696355635707867, |
|
"eval_macro_specificity": 0.9850538317438372, |
|
"eval_precision": 0.8109768674187026, |
|
"eval_precision_macro": 0.7369403978788467, |
|
"eval_recall": 0.8001549186676995, |
|
"eval_recall_macro": 0.7696355635707867, |
|
"eval_runtime": 89.6171, |
|
"eval_samples_per_second": 14.406, |
|
"eval_steps_per_second": 1.808, |
|
"eval_weighted_fpr": 0.017527173913043478, |
|
"eval_weighted_sensitivity": 0.8001549186676995, |
|
"eval_weighted_specificity": 0.9756525574898595, |
|
"step": 9645 |
|
}, |
|
{ |
|
"epoch": 15.55, |
|
"learning_rate": 2.4095386210471748e-05, |
|
"loss": 0.0241, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8179705654531371, |
|
"eval_f1_macro": 0.7780054113531673, |
|
"eval_f1_micro": 0.817970565453137, |
|
"eval_f1_weighted": 0.8174074193030834, |
|
"eval_loss": 1.7145990133285522, |
|
"eval_macro_fpr": 0.01624192113353871, |
|
"eval_macro_sensitivity": 0.7786912615456476, |
|
"eval_macro_specificity": 0.9862689663514356, |
|
"eval_precision": 0.8189471437742178, |
|
"eval_precision_macro": 0.7852139494262297, |
|
"eval_recall": 0.8179705654531371, |
|
"eval_recall_macro": 0.7786912615456476, |
|
"eval_runtime": 95.9969, |
|
"eval_samples_per_second": 13.448, |
|
"eval_steps_per_second": 1.688, |
|
"eval_weighted_fpr": 0.01564684732671949, |
|
"eval_weighted_sensitivity": 0.8179705654531371, |
|
"eval_weighted_specificity": 0.9760639298183975, |
|
"step": 10288 |
|
}, |
|
{ |
|
"epoch": 16.33, |
|
"learning_rate": 2.280196993260757e-05, |
|
"loss": 0.0226, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.820294345468629, |
|
"eval_f1_macro": 0.7713653883357572, |
|
"eval_f1_micro": 0.8202943454686291, |
|
"eval_f1_weighted": 0.8205584776004088, |
|
"eval_loss": 1.703484296798706, |
|
"eval_macro_fpr": 0.015955392684873622, |
|
"eval_macro_sensitivity": 0.7780791588964692, |
|
"eval_macro_specificity": 0.9865149979627027, |
|
"eval_precision": 0.8238197570339643, |
|
"eval_precision_macro": 0.7731970694747214, |
|
"eval_recall": 0.820294345468629, |
|
"eval_recall_macro": 0.7780791588964692, |
|
"eval_runtime": 92.4633, |
|
"eval_samples_per_second": 13.962, |
|
"eval_steps_per_second": 1.752, |
|
"eval_weighted_fpr": 0.015407092575375215, |
|
"eval_weighted_sensitivity": 0.820294345468629, |
|
"eval_weighted_specificity": 0.9774306239719132, |
|
"step": 10931 |
|
}, |
|
{ |
|
"epoch": 17.11, |
|
"learning_rate": 2.1505961638154484e-05, |
|
"loss": 0.017, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 17.88, |
|
"learning_rate": 2.0209953343701402e-05, |
|
"loss": 0.0189, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.8164213787761425, |
|
"eval_f1_macro": 0.7577737009484876, |
|
"eval_f1_micro": 0.8164213787761425, |
|
"eval_f1_weighted": 0.814862576730404, |
|
"eval_loss": 1.8079380989074707, |
|
"eval_macro_fpr": 0.016561980735895838, |
|
"eval_macro_sensitivity": 0.7677111310031827, |
|
"eval_macro_specificity": 0.9860906809860878, |
|
"eval_precision": 0.8160431006408752, |
|
"eval_precision_macro": 0.7583264160007077, |
|
"eval_recall": 0.8164213787761425, |
|
"eval_recall_macro": 0.7677111310031827, |
|
"eval_runtime": 93.2101, |
|
"eval_samples_per_second": 13.85, |
|
"eval_steps_per_second": 1.738, |
|
"eval_weighted_fpr": 0.01580737677582872, |
|
"eval_weighted_sensitivity": 0.8164213787761425, |
|
"eval_weighted_specificity": 0.9749388360151747, |
|
"step": 11574 |
|
}, |
|
{ |
|
"epoch": 18.66, |
|
"learning_rate": 1.8913945049248317e-05, |
|
"loss": 0.026, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.8125484120836561, |
|
"eval_f1_macro": 0.7718943136435594, |
|
"eval_f1_micro": 0.8125484120836561, |
|
"eval_f1_weighted": 0.8138445092504973, |
|
"eval_loss": 1.8187031745910645, |
|
"eval_macro_fpr": 0.016881633170148187, |
|
"eval_macro_sensitivity": 0.7832768313344278, |
|
"eval_macro_specificity": 0.9858228106032249, |
|
"eval_precision": 0.8169875491486152, |
|
"eval_precision_macro": 0.7674779420581895, |
|
"eval_recall": 0.8125484120836561, |
|
"eval_recall_macro": 0.7832768313344278, |
|
"eval_runtime": 90.0764, |
|
"eval_samples_per_second": 14.332, |
|
"eval_steps_per_second": 1.798, |
|
"eval_weighted_fpr": 0.016211146838156484, |
|
"eval_weighted_sensitivity": 0.8125484120836561, |
|
"eval_weighted_specificity": 0.9747937469647154, |
|
"step": 12217 |
|
}, |
|
{ |
|
"epoch": 19.44, |
|
"learning_rate": 1.761793675479523e-05, |
|
"loss": 0.0101, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.8187451587916343, |
|
"eval_f1_macro": 0.7709574718137391, |
|
"eval_f1_micro": 0.8187451587916342, |
|
"eval_f1_weighted": 0.8179619842347855, |
|
"eval_loss": 1.8353675603866577, |
|
"eval_macro_fpr": 0.01611361621724302, |
|
"eval_macro_sensitivity": 0.7817701569841005, |
|
"eval_macro_specificity": 0.9863995310478259, |
|
"eval_precision": 0.8219549803396689, |
|
"eval_precision_macro": 0.7748222861859084, |
|
"eval_recall": 0.8187451587916343, |
|
"eval_recall_macro": 0.7817701569841005, |
|
"eval_runtime": 86.3867, |
|
"eval_samples_per_second": 14.944, |
|
"eval_steps_per_second": 1.875, |
|
"eval_weighted_fpr": 0.015566790846194785, |
|
"eval_weighted_sensitivity": 0.8187451587916343, |
|
"eval_weighted_specificity": 0.9772478069257525, |
|
"step": 12860 |
|
}, |
|
{ |
|
"epoch": 20.22, |
|
"learning_rate": 1.632192846034215e-05, |
|
"loss": 0.0097, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"learning_rate": 1.502851218247797e-05, |
|
"loss": 0.0216, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.8156467854376452, |
|
"eval_f1_macro": 0.7618079234508338, |
|
"eval_f1_micro": 0.8156467854376452, |
|
"eval_f1_weighted": 0.8164347717885334, |
|
"eval_loss": 1.8372349739074707, |
|
"eval_macro_fpr": 0.016334927583449652, |
|
"eval_macro_sensitivity": 0.7857843546777831, |
|
"eval_macro_specificity": 0.9863030854921722, |
|
"eval_precision": 0.8219293193926849, |
|
"eval_precision_macro": 0.7502422859641604, |
|
"eval_recall": 0.8156467854376452, |
|
"eval_recall_macro": 0.7857843546777831, |
|
"eval_runtime": 87.8538, |
|
"eval_samples_per_second": 14.695, |
|
"eval_steps_per_second": 1.844, |
|
"eval_weighted_fpr": 0.01588785046728972, |
|
"eval_weighted_sensitivity": 0.8156467854376452, |
|
"eval_weighted_specificity": 0.9788994969449356, |
|
"step": 13503 |
|
}, |
|
{ |
|
"epoch": 21.77, |
|
"learning_rate": 1.3732503888024884e-05, |
|
"loss": 0.0138, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.820294345468629, |
|
"eval_f1_macro": 0.7661945549993608, |
|
"eval_f1_micro": 0.8202943454686291, |
|
"eval_f1_weighted": 0.8222065987286614, |
|
"eval_loss": 1.8472038507461548, |
|
"eval_macro_fpr": 0.015872843311496198, |
|
"eval_macro_sensitivity": 0.7796378584356709, |
|
"eval_macro_specificity": 0.9865941123818214, |
|
"eval_precision": 0.8262928188362502, |
|
"eval_precision_macro": 0.7613141480374475, |
|
"eval_recall": 0.820294345468629, |
|
"eval_recall_macro": 0.7796378584356709, |
|
"eval_runtime": 85.3935, |
|
"eval_samples_per_second": 15.118, |
|
"eval_steps_per_second": 1.897, |
|
"eval_weighted_fpr": 0.015407092575375215, |
|
"eval_weighted_sensitivity": 0.820294345468629, |
|
"eval_weighted_specificity": 0.9786173402586936, |
|
"step": 14146 |
|
}, |
|
{ |
|
"epoch": 22.55, |
|
"learning_rate": 1.2436495593571799e-05, |
|
"loss": 0.0169, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.8218435321456236, |
|
"eval_f1_macro": 0.760658140409385, |
|
"eval_f1_micro": 0.8218435321456236, |
|
"eval_f1_weighted": 0.8209229699908378, |
|
"eval_loss": 1.8103588819503784, |
|
"eval_macro_fpr": 0.016045052484127836, |
|
"eval_macro_sensitivity": 0.7595040114200765, |
|
"eval_macro_specificity": 0.986451381533847, |
|
"eval_precision": 0.8251783607661838, |
|
"eval_precision_macro": 0.7718974635406236, |
|
"eval_recall": 0.8218435321456236, |
|
"eval_recall_macro": 0.7595040114200765, |
|
"eval_runtime": 92.1092, |
|
"eval_samples_per_second": 14.016, |
|
"eval_steps_per_second": 1.759, |
|
"eval_weighted_fpr": 0.015247944842216919, |
|
"eval_weighted_sensitivity": 0.8218435321456236, |
|
"eval_weighted_specificity": 0.9749271908620799, |
|
"step": 14789 |
|
}, |
|
{ |
|
"epoch": 23.33, |
|
"learning_rate": 1.1140487299118715e-05, |
|
"loss": 0.0079, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.8109992254066615, |
|
"eval_f1_macro": 0.7524207866195778, |
|
"eval_f1_micro": 0.8109992254066615, |
|
"eval_f1_weighted": 0.8122562112865754, |
|
"eval_loss": 1.9252820014953613, |
|
"eval_macro_fpr": 0.017055628961045247, |
|
"eval_macro_sensitivity": 0.7576415197380852, |
|
"eval_macro_specificity": 0.985793052330349, |
|
"eval_precision": 0.8202456922159745, |
|
"eval_precision_macro": 0.7621718512762216, |
|
"eval_recall": 0.8109992254066615, |
|
"eval_recall_macro": 0.7576415197380852, |
|
"eval_runtime": 93.885, |
|
"eval_samples_per_second": 13.751, |
|
"eval_steps_per_second": 1.726, |
|
"eval_weighted_fpr": 0.016373641121997046, |
|
"eval_weighted_sensitivity": 0.8109992254066615, |
|
"eval_weighted_specificity": 0.9758965595485739, |
|
"step": 15432 |
|
}, |
|
{ |
|
"epoch": 24.11, |
|
"learning_rate": 9.84447900466563e-06, |
|
"loss": 0.0094, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 24.88, |
|
"learning_rate": 8.551062726801453e-06, |
|
"loss": 0.0017, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.8156467854376452, |
|
"eval_f1_macro": 0.7594027956673404, |
|
"eval_f1_micro": 0.8156467854376452, |
|
"eval_f1_weighted": 0.8154952009918864, |
|
"eval_loss": 1.9110798835754395, |
|
"eval_macro_fpr": 0.016444882591068778, |
|
"eval_macro_sensitivity": 0.7742299386060195, |
|
"eval_macro_specificity": 0.9862078449547576, |
|
"eval_precision": 0.8193166881646313, |
|
"eval_precision_macro": 0.7554028042588868, |
|
"eval_recall": 0.8156467854376452, |
|
"eval_recall_macro": 0.7742299386060195, |
|
"eval_runtime": 92.0946, |
|
"eval_samples_per_second": 14.018, |
|
"eval_steps_per_second": 1.759, |
|
"eval_weighted_fpr": 0.01588785046728972, |
|
"eval_weighted_sensitivity": 0.8156467854376452, |
|
"eval_weighted_specificity": 0.97747088888372, |
|
"step": 16075 |
|
}, |
|
{ |
|
"epoch": 25.66, |
|
"learning_rate": 7.255054432348367e-06, |
|
"loss": 0.0071, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.8187451587916343, |
|
"eval_f1_macro": 0.7601055992728972, |
|
"eval_f1_micro": 0.8187451587916342, |
|
"eval_f1_weighted": 0.8199059390372757, |
|
"eval_loss": 1.880871057510376, |
|
"eval_macro_fpr": 0.01605804835750131, |
|
"eval_macro_sensitivity": 0.7748936539821518, |
|
"eval_macro_specificity": 0.9864696047286632, |
|
"eval_precision": 0.824436161286693, |
|
"eval_precision_macro": 0.7594879689938191, |
|
"eval_recall": 0.8187451587916343, |
|
"eval_recall_macro": 0.7748936539821518, |
|
"eval_runtime": 88.2427, |
|
"eval_samples_per_second": 14.63, |
|
"eval_steps_per_second": 1.836, |
|
"eval_weighted_fpr": 0.015566790846194785, |
|
"eval_weighted_sensitivity": 0.8187451587916343, |
|
"eval_weighted_specificity": 0.9782989121383131, |
|
"step": 16718 |
|
}, |
|
{ |
|
"epoch": 26.44, |
|
"learning_rate": 5.9590461378952825e-06, |
|
"loss": 0.0032, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.8272656855151046, |
|
"eval_f1_macro": 0.7718154001656008, |
|
"eval_f1_micro": 0.8272656855151046, |
|
"eval_f1_weighted": 0.8288829948767273, |
|
"eval_loss": 1.8246089220046997, |
|
"eval_macro_fpr": 0.015208141271413749, |
|
"eval_macro_sensitivity": 0.7806866379450543, |
|
"eval_macro_specificity": 0.9870589996943918, |
|
"eval_precision": 0.8333256234957093, |
|
"eval_precision_macro": 0.772651547029787, |
|
"eval_recall": 0.8272656855151046, |
|
"eval_recall_macro": 0.7806866379450543, |
|
"eval_runtime": 86.7033, |
|
"eval_samples_per_second": 14.89, |
|
"eval_steps_per_second": 1.868, |
|
"eval_weighted_fpr": 0.014695222405271829, |
|
"eval_weighted_sensitivity": 0.8272656855151046, |
|
"eval_weighted_specificity": 0.9786193099007718, |
|
"step": 17361 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 19290, |
|
"num_train_epochs": 30, |
|
"save_steps": 500, |
|
"total_flos": 4.254975617176166e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|