{ "best_metric": 0.7780054113531673, "best_model_checkpoint": "bart-base/checkpoint-10288", "epoch": 23.0, "eval_steps": 500, "global_step": 14789, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.78, "learning_rate": 4.871176775531364e-05, "loss": 1.2028, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.7598760650658405, "eval_f1_macro": 0.6063644681337579, "eval_f1_micro": 0.7598760650658405, "eval_f1_weighted": 0.7489266744747745, "eval_loss": 0.8429557681083679, "eval_macro_fpr": 0.023226157303183535, "eval_macro_sensitivity": 0.6366904609623596, "eval_macro_specificity": 0.981694425945952, "eval_precision": 0.7600880594489849, "eval_precision_macro": 0.6003620126022547, "eval_recall": 0.7598760650658405, "eval_recall_macro": 0.6366904609623596, "eval_runtime": 43.5934, "eval_samples_per_second": 29.615, "eval_steps_per_second": 3.716, "eval_weighted_fpr": 0.02207348333808032, "eval_weighted_sensitivity": 0.7598760650658405, "eval_weighted_specificity": 0.9655403241234398, "step": 643 }, { "epoch": 1.56, "learning_rate": 4.741575946086055e-05, "loss": 0.715, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.7931835786212239, "eval_f1_macro": 0.7213629796675549, "eval_f1_micro": 0.793183578621224, "eval_f1_weighted": 0.7853477061503886, "eval_loss": 0.7331996560096741, "eval_macro_fpr": 0.018982515099395962, "eval_macro_sensitivity": 0.7320748785168393, "eval_macro_specificity": 0.9845140063777027, "eval_precision": 0.8019650926098448, "eval_precision_macro": 0.7386000214414028, "eval_recall": 0.7931835786212239, "eval_recall_macro": 0.7320748785168393, "eval_runtime": 77.2393, "eval_samples_per_second": 16.714, "eval_steps_per_second": 2.097, "eval_weighted_fpr": 0.018283914264192288, "eval_weighted_sensitivity": 0.7931835786212239, "eval_weighted_specificity": 0.9745265170443169, "step": 1286 }, { "epoch": 2.33, "learning_rate": 4.611975116640747e-05, "loss": 0.578, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.7939581719597212, "eval_f1_macro": 0.6998313050068915, "eval_f1_micro": 0.7939581719597211, "eval_f1_weighted": 0.79006368267302, "eval_loss": 0.8045273423194885, "eval_macro_fpr": 0.018545878882531782, "eval_macro_sensitivity": 0.7068834234702027, "eval_macro_specificity": 0.9847671550097226, "eval_precision": 0.8075005963568469, "eval_precision_macro": 0.7230632440844518, "eval_recall": 0.7939581719597212, "eval_recall_macro": 0.7068834234702027, "eval_runtime": 86.4099, "eval_samples_per_second": 14.94, "eval_steps_per_second": 1.875, "eval_weighted_fpr": 0.018199233716475097, "eval_weighted_sensitivity": 0.7939581719597212, "eval_weighted_specificity": 0.977549153186118, "step": 1929 }, { "epoch": 3.11, "learning_rate": 4.482633488854329e-05, "loss": 0.481, "step": 2000 }, { "epoch": 3.89, "learning_rate": 4.3530326594090203e-05, "loss": 0.3938, "step": 2500 }, { "epoch": 4.0, "eval_accuracy": 0.8156467854376452, "eval_f1_macro": 0.7369315728111729, "eval_f1_micro": 0.8156467854376452, "eval_f1_weighted": 0.8105168035589256, "eval_loss": 0.8291025161743164, "eval_macro_fpr": 0.016938074954137138, "eval_macro_sensitivity": 0.7217605983180461, "eval_macro_specificity": 0.9857842035419169, "eval_precision": 0.8171220006778526, "eval_precision_macro": 0.7937034642937142, "eval_recall": 0.8156467854376452, "eval_recall_macro": 0.7217605983180461, "eval_runtime": 84.4366, "eval_samples_per_second": 15.29, "eval_steps_per_second": 1.919, "eval_weighted_fpr": 0.01588785046728972, "eval_weighted_sensitivity": 0.8156467854376452, "eval_weighted_specificity": 0.9711162676911109, "step": 2572 }, { "epoch": 4.67, "learning_rate": 4.2236910316226025e-05, "loss": 0.3238, "step": 3000 }, { "epoch": 5.0, "eval_accuracy": 0.7939581719597212, "eval_f1_macro": 0.7360579650857649, "eval_f1_micro": 0.7939581719597211, "eval_f1_weighted": 0.7995200606905476, "eval_loss": 0.8888681530952454, "eval_macro_fpr": 0.018767728188278533, "eval_macro_sensitivity": 0.7515467286591376, "eval_macro_specificity": 0.9846803211687324, "eval_precision": 0.8146370555192632, "eval_precision_macro": 0.7464262358644205, "eval_recall": 0.7939581719597212, "eval_recall_macro": 0.7515467286591376, "eval_runtime": 82.179, "eval_samples_per_second": 15.71, "eval_steps_per_second": 1.971, "eval_weighted_fpr": 0.018199233716475097, "eval_weighted_sensitivity": 0.7939581719597212, "eval_weighted_specificity": 0.9762466455712672, "step": 3215 }, { "epoch": 5.44, "learning_rate": 4.094090202177294e-05, "loss": 0.246, "step": 3500 }, { "epoch": 6.0, "eval_accuracy": 0.7955073586367157, "eval_f1_macro": 0.7362210043644567, "eval_f1_micro": 0.7955073586367158, "eval_f1_weighted": 0.7945977979999089, "eval_loss": 1.1628626585006714, "eval_macro_fpr": 0.01863187379355594, "eval_macro_sensitivity": 0.7599986341032186, "eval_macro_specificity": 0.9846932142915057, "eval_precision": 0.8066758597712774, "eval_precision_macro": 0.7483163388808308, "eval_recall": 0.7955073586367157, "eval_recall_macro": 0.7599986341032186, "eval_runtime": 82.1621, "eval_samples_per_second": 15.713, "eval_steps_per_second": 1.972, "eval_weighted_fpr": 0.018030323726266905, "eval_weighted_sensitivity": 0.7955073586367157, "eval_weighted_specificity": 0.9748908557358684, "step": 3858 }, { "epoch": 6.22, "learning_rate": 3.964489372731986e-05, "loss": 0.228, "step": 4000 }, { "epoch": 7.0, "learning_rate": 3.834888543286677e-05, "loss": 0.1791, "step": 4500 }, { "epoch": 7.0, "eval_accuracy": 0.8179705654531371, "eval_f1_macro": 0.7736489492761546, "eval_f1_micro": 0.817970565453137, "eval_f1_weighted": 0.8146592022169725, "eval_loss": 1.1354283094406128, "eval_macro_fpr": 0.016454731140779742, "eval_macro_sensitivity": 0.7696557438486226, "eval_macro_specificity": 0.9861772746118799, "eval_precision": 0.8150792023791334, "eval_precision_macro": 0.7832166669456337, "eval_recall": 0.8179705654531371, "eval_recall_macro": 0.7696557438486226, "eval_runtime": 85.4548, "eval_samples_per_second": 15.107, "eval_steps_per_second": 1.896, "eval_weighted_fpr": 0.01564684732671949, "eval_weighted_sensitivity": 0.8179705654531371, "eval_weighted_specificity": 0.9746885537250626, "step": 4501 }, { "epoch": 7.78, "learning_rate": 3.705546915500259e-05, "loss": 0.1305, "step": 5000 }, { "epoch": 8.0, "eval_accuracy": 0.8109992254066615, "eval_f1_macro": 0.7368975448573482, "eval_f1_micro": 0.8109992254066615, "eval_f1_weighted": 0.808822910649843, "eval_loss": 1.282464861869812, "eval_macro_fpr": 0.016943107063520774, "eval_macro_sensitivity": 0.7488577570944955, "eval_macro_specificity": 0.9858309939135591, "eval_precision": 0.8147632227505013, "eval_precision_macro": 0.7422132710401315, "eval_recall": 0.8109992254066615, "eval_recall_macro": 0.7488577570944955, "eval_runtime": 87.6049, "eval_samples_per_second": 14.737, "eval_steps_per_second": 1.849, "eval_weighted_fpr": 0.016373641121997046, "eval_weighted_sensitivity": 0.8109992254066615, "eval_weighted_specificity": 0.9764656832967246, "step": 5144 }, { "epoch": 8.55, "learning_rate": 3.575946086054951e-05, "loss": 0.0924, "step": 5500 }, { "epoch": 9.0, "eval_accuracy": 0.8040278853601859, "eval_f1_macro": 0.7559721746710123, "eval_f1_micro": 0.8040278853601859, "eval_f1_weighted": 0.80145679310201, "eval_loss": 1.421708583831787, "eval_macro_fpr": 0.017802568540250287, "eval_macro_sensitivity": 0.7809236600744539, "eval_macro_specificity": 0.9853492039682624, "eval_precision": 0.8113877598541575, "eval_precision_macro": 0.7464644897074477, "eval_recall": 0.8040278853601859, "eval_recall_macro": 0.7809236600744539, "eval_runtime": 89.5999, "eval_samples_per_second": 14.408, "eval_steps_per_second": 1.808, "eval_weighted_fpr": 0.017111937774771727, "eval_weighted_sensitivity": 0.8040278853601859, "eval_weighted_specificity": 0.9762101741637506, "step": 5787 }, { "epoch": 9.33, "learning_rate": 3.446345256609643e-05, "loss": 0.0953, "step": 6000 }, { "epoch": 10.0, "eval_accuracy": 0.8024786986831913, "eval_f1_macro": 0.7661426626929498, "eval_f1_micro": 0.8024786986831914, "eval_f1_weighted": 0.8001228885030943, "eval_loss": 1.5552372932434082, "eval_macro_fpr": 0.018250858387380567, "eval_macro_sensitivity": 0.7822186507003115, "eval_macro_specificity": 0.9849087494473102, "eval_precision": 0.8055922813865947, "eval_precision_macro": 0.7702182213697708, "eval_recall": 0.8024786986831913, "eval_recall_macro": 0.7822186507003115, "eval_runtime": 85.2534, "eval_samples_per_second": 15.143, "eval_steps_per_second": 1.9, "eval_weighted_fpr": 0.017277593332881633, "eval_weighted_sensitivity": 0.8024786986831913, "eval_weighted_specificity": 0.9711525430264618, "step": 6430 }, { "epoch": 10.11, "learning_rate": 3.316744427164334e-05, "loss": 0.0668, "step": 6500 }, { "epoch": 10.89, "learning_rate": 3.1871435977190256e-05, "loss": 0.0617, "step": 7000 }, { "epoch": 11.0, "eval_accuracy": 0.8040278853601859, "eval_f1_macro": 0.7422420279485343, "eval_f1_micro": 0.8040278853601859, "eval_f1_weighted": 0.8069943234338898, "eval_loss": 1.5223894119262695, "eval_macro_fpr": 0.017602619829831197, "eval_macro_sensitivity": 0.7512050029477755, "eval_macro_specificity": 0.9853474796083734, "eval_precision": 0.8144253833246468, "eval_precision_macro": 0.745702567690635, "eval_recall": 0.8040278853601859, "eval_recall_macro": 0.7512050029477755, "eval_runtime": 85.7004, "eval_samples_per_second": 15.064, "eval_steps_per_second": 1.89, "eval_weighted_fpr": 0.017111937774771727, "eval_weighted_sensitivity": 0.8040278853601859, "eval_weighted_specificity": 0.9761843087654142, "step": 7073 }, { "epoch": 11.66, "learning_rate": 3.057542768273717e-05, "loss": 0.0582, "step": 7500 }, { "epoch": 12.0, "eval_accuracy": 0.7970565453137103, "eval_f1_macro": 0.7465072775190384, "eval_f1_micro": 0.7970565453137104, "eval_f1_weighted": 0.8021748784206515, "eval_loss": 1.6427809000015259, "eval_macro_fpr": 0.01832354936918133, "eval_macro_sensitivity": 0.7654834054509102, "eval_macro_specificity": 0.9849466228972559, "eval_precision": 0.8148454054398186, "eval_precision_macro": 0.7470312881962948, "eval_recall": 0.7970565453137103, "eval_recall_macro": 0.7654834054509102, "eval_runtime": 95.4565, "eval_samples_per_second": 13.524, "eval_steps_per_second": 1.697, "eval_weighted_fpr": 0.017862012544314153, "eval_weighted_sensitivity": 0.7970565453137103, "eval_weighted_specificity": 0.9771427981451267, "step": 7716 }, { "epoch": 12.44, "learning_rate": 2.9279419388284086e-05, "loss": 0.0511, "step": 8000 }, { "epoch": 13.0, "eval_accuracy": 0.8195197521301317, "eval_f1_macro": 0.7586168211948496, "eval_f1_micro": 0.8195197521301317, "eval_f1_weighted": 0.8186828900418365, "eval_loss": 1.4951962232589722, "eval_macro_fpr": 0.016182326988526896, "eval_macro_sensitivity": 0.7580273333502953, "eval_macro_specificity": 0.9863597979839632, "eval_precision": 0.8208277188287908, "eval_precision_macro": 0.7645206618886077, "eval_recall": 0.8195197521301317, "eval_recall_macro": 0.7580273333502953, "eval_runtime": 85.8279, "eval_samples_per_second": 15.042, "eval_steps_per_second": 1.887, "eval_weighted_fpr": 0.01548687271518777, "eval_weighted_sensitivity": 0.8195197521301317, "eval_weighted_specificity": 0.9758772176293167, "step": 8359 }, { "epoch": 13.22, "learning_rate": 2.7983411093831004e-05, "loss": 0.0403, "step": 8500 }, { "epoch": 14.0, "learning_rate": 2.668740279937792e-05, "loss": 0.0476, "step": 9000 }, { "epoch": 14.0, "eval_accuracy": 0.7970565453137103, "eval_f1_macro": 0.7416650578915932, "eval_f1_micro": 0.7970565453137104, "eval_f1_weighted": 0.7913296065268454, "eval_loss": 1.7132102251052856, "eval_macro_fpr": 0.018853564171086353, "eval_macro_sensitivity": 0.7328360987022614, "eval_macro_specificity": 0.9845211676049321, "eval_precision": 0.795801987953062, "eval_precision_macro": 0.763738385548772, "eval_recall": 0.7970565453137103, "eval_recall_macro": 0.7328360987022614, "eval_runtime": 90.1914, "eval_samples_per_second": 14.314, "eval_steps_per_second": 1.796, "eval_weighted_fpr": 0.017862012544314153, "eval_weighted_sensitivity": 0.7970565453137103, "eval_weighted_specificity": 0.9707609687602743, "step": 9002 }, { "epoch": 14.77, "learning_rate": 2.5391394504924833e-05, "loss": 0.0375, "step": 9500 }, { "epoch": 15.0, "eval_accuracy": 0.8001549186676995, "eval_f1_macro": 0.7437118125777374, "eval_f1_micro": 0.8001549186676995, "eval_f1_weighted": 0.8017305518379161, "eval_loss": 1.7058144807815552, "eval_macro_fpr": 0.018188016275518495, "eval_macro_sensitivity": 0.7696355635707867, "eval_macro_specificity": 0.9850538317438372, "eval_precision": 0.8109768674187026, "eval_precision_macro": 0.7369403978788467, "eval_recall": 0.8001549186676995, "eval_recall_macro": 0.7696355635707867, "eval_runtime": 89.6171, "eval_samples_per_second": 14.406, "eval_steps_per_second": 1.808, "eval_weighted_fpr": 0.017527173913043478, "eval_weighted_sensitivity": 0.8001549186676995, "eval_weighted_specificity": 0.9756525574898595, "step": 9645 }, { "epoch": 15.55, "learning_rate": 2.4095386210471748e-05, "loss": 0.0241, "step": 10000 }, { "epoch": 16.0, "eval_accuracy": 0.8179705654531371, "eval_f1_macro": 0.7780054113531673, "eval_f1_micro": 0.817970565453137, "eval_f1_weighted": 0.8174074193030834, "eval_loss": 1.7145990133285522, "eval_macro_fpr": 0.01624192113353871, "eval_macro_sensitivity": 0.7786912615456476, "eval_macro_specificity": 0.9862689663514356, "eval_precision": 0.8189471437742178, "eval_precision_macro": 0.7852139494262297, "eval_recall": 0.8179705654531371, "eval_recall_macro": 0.7786912615456476, "eval_runtime": 95.9969, "eval_samples_per_second": 13.448, "eval_steps_per_second": 1.688, "eval_weighted_fpr": 0.01564684732671949, "eval_weighted_sensitivity": 0.8179705654531371, "eval_weighted_specificity": 0.9760639298183975, "step": 10288 }, { "epoch": 16.33, "learning_rate": 2.280196993260757e-05, "loss": 0.0226, "step": 10500 }, { "epoch": 17.0, "eval_accuracy": 0.820294345468629, "eval_f1_macro": 0.7713653883357572, "eval_f1_micro": 0.8202943454686291, "eval_f1_weighted": 0.8205584776004088, "eval_loss": 1.703484296798706, "eval_macro_fpr": 0.015955392684873622, "eval_macro_sensitivity": 0.7780791588964692, "eval_macro_specificity": 0.9865149979627027, "eval_precision": 0.8238197570339643, "eval_precision_macro": 0.7731970694747214, "eval_recall": 0.820294345468629, "eval_recall_macro": 0.7780791588964692, "eval_runtime": 92.4633, "eval_samples_per_second": 13.962, "eval_steps_per_second": 1.752, "eval_weighted_fpr": 0.015407092575375215, "eval_weighted_sensitivity": 0.820294345468629, "eval_weighted_specificity": 0.9774306239719132, "step": 10931 }, { "epoch": 17.11, "learning_rate": 2.1505961638154484e-05, "loss": 0.017, "step": 11000 }, { "epoch": 17.88, "learning_rate": 2.0209953343701402e-05, "loss": 0.0189, "step": 11500 }, { "epoch": 18.0, "eval_accuracy": 0.8164213787761425, "eval_f1_macro": 0.7577737009484876, "eval_f1_micro": 0.8164213787761425, "eval_f1_weighted": 0.814862576730404, "eval_loss": 1.8079380989074707, "eval_macro_fpr": 0.016561980735895838, "eval_macro_sensitivity": 0.7677111310031827, "eval_macro_specificity": 0.9860906809860878, "eval_precision": 0.8160431006408752, "eval_precision_macro": 0.7583264160007077, "eval_recall": 0.8164213787761425, "eval_recall_macro": 0.7677111310031827, "eval_runtime": 93.2101, "eval_samples_per_second": 13.85, "eval_steps_per_second": 1.738, "eval_weighted_fpr": 0.01580737677582872, "eval_weighted_sensitivity": 0.8164213787761425, "eval_weighted_specificity": 0.9749388360151747, "step": 11574 }, { "epoch": 18.66, "learning_rate": 1.8913945049248317e-05, "loss": 0.026, "step": 12000 }, { "epoch": 19.0, "eval_accuracy": 0.8125484120836561, "eval_f1_macro": 0.7718943136435594, "eval_f1_micro": 0.8125484120836561, "eval_f1_weighted": 0.8138445092504973, "eval_loss": 1.8187031745910645, "eval_macro_fpr": 0.016881633170148187, "eval_macro_sensitivity": 0.7832768313344278, "eval_macro_specificity": 0.9858228106032249, "eval_precision": 0.8169875491486152, "eval_precision_macro": 0.7674779420581895, "eval_recall": 0.8125484120836561, "eval_recall_macro": 0.7832768313344278, "eval_runtime": 90.0764, "eval_samples_per_second": 14.332, "eval_steps_per_second": 1.798, "eval_weighted_fpr": 0.016211146838156484, "eval_weighted_sensitivity": 0.8125484120836561, "eval_weighted_specificity": 0.9747937469647154, "step": 12217 }, { "epoch": 19.44, "learning_rate": 1.761793675479523e-05, "loss": 0.0101, "step": 12500 }, { "epoch": 20.0, "eval_accuracy": 0.8187451587916343, "eval_f1_macro": 0.7709574718137391, "eval_f1_micro": 0.8187451587916342, "eval_f1_weighted": 0.8179619842347855, "eval_loss": 1.8353675603866577, "eval_macro_fpr": 0.01611361621724302, "eval_macro_sensitivity": 0.7817701569841005, "eval_macro_specificity": 0.9863995310478259, "eval_precision": 0.8219549803396689, "eval_precision_macro": 0.7748222861859084, "eval_recall": 0.8187451587916343, "eval_recall_macro": 0.7817701569841005, "eval_runtime": 86.3867, "eval_samples_per_second": 14.944, "eval_steps_per_second": 1.875, "eval_weighted_fpr": 0.015566790846194785, "eval_weighted_sensitivity": 0.8187451587916343, "eval_weighted_specificity": 0.9772478069257525, "step": 12860 }, { "epoch": 20.22, "learning_rate": 1.632192846034215e-05, "loss": 0.0097, "step": 13000 }, { "epoch": 21.0, "learning_rate": 1.502851218247797e-05, "loss": 0.0216, "step": 13500 }, { "epoch": 21.0, "eval_accuracy": 0.8156467854376452, "eval_f1_macro": 0.7618079234508338, "eval_f1_micro": 0.8156467854376452, "eval_f1_weighted": 0.8164347717885334, "eval_loss": 1.8372349739074707, "eval_macro_fpr": 0.016334927583449652, "eval_macro_sensitivity": 0.7857843546777831, "eval_macro_specificity": 0.9863030854921722, "eval_precision": 0.8219293193926849, "eval_precision_macro": 0.7502422859641604, "eval_recall": 0.8156467854376452, "eval_recall_macro": 0.7857843546777831, "eval_runtime": 87.8538, "eval_samples_per_second": 14.695, "eval_steps_per_second": 1.844, "eval_weighted_fpr": 0.01588785046728972, "eval_weighted_sensitivity": 0.8156467854376452, "eval_weighted_specificity": 0.9788994969449356, "step": 13503 }, { "epoch": 21.77, "learning_rate": 1.3732503888024884e-05, "loss": 0.0138, "step": 14000 }, { "epoch": 22.0, "eval_accuracy": 0.820294345468629, "eval_f1_macro": 0.7661945549993608, "eval_f1_micro": 0.8202943454686291, "eval_f1_weighted": 0.8222065987286614, "eval_loss": 1.8472038507461548, "eval_macro_fpr": 0.015872843311496198, "eval_macro_sensitivity": 0.7796378584356709, "eval_macro_specificity": 0.9865941123818214, "eval_precision": 0.8262928188362502, "eval_precision_macro": 0.7613141480374475, "eval_recall": 0.820294345468629, "eval_recall_macro": 0.7796378584356709, "eval_runtime": 85.3935, "eval_samples_per_second": 15.118, "eval_steps_per_second": 1.897, "eval_weighted_fpr": 0.015407092575375215, "eval_weighted_sensitivity": 0.820294345468629, "eval_weighted_specificity": 0.9786173402586936, "step": 14146 }, { "epoch": 22.55, "learning_rate": 1.2436495593571799e-05, "loss": 0.0169, "step": 14500 }, { "epoch": 23.0, "eval_accuracy": 0.8218435321456236, "eval_f1_macro": 0.760658140409385, "eval_f1_micro": 0.8218435321456236, "eval_f1_weighted": 0.8209229699908378, "eval_loss": 1.8103588819503784, "eval_macro_fpr": 0.016045052484127836, "eval_macro_sensitivity": 0.7595040114200765, "eval_macro_specificity": 0.986451381533847, "eval_precision": 0.8251783607661838, "eval_precision_macro": 0.7718974635406236, "eval_recall": 0.8218435321456236, "eval_recall_macro": 0.7595040114200765, "eval_runtime": 92.1092, "eval_samples_per_second": 14.016, "eval_steps_per_second": 1.759, "eval_weighted_fpr": 0.015247944842216919, "eval_weighted_sensitivity": 0.8218435321456236, "eval_weighted_specificity": 0.9749271908620799, "step": 14789 } ], "logging_steps": 500, "max_steps": 19290, "num_train_epochs": 30, "save_steps": 500, "total_flos": 3.624608859075994e+16, "trial_name": null, "trial_params": null }