{ "best_metric": 0.6261172643852387, "best_model_checkpoint": "bart-base-lora/checkpoint-2250", "epoch": 13.996889580093313, "eval_steps": 500, "global_step": 2250, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.611154144074361, "eval_f1_macro": 0.28705545756004525, "eval_f1_micro": 0.611154144074361, "eval_f1_weighted": 0.5574695078229231, "eval_loss": 1.3204560279846191, "eval_macro_fpr": 0.046390243375546196, "eval_macro_sensitivity": 0.302378554842108, "eval_macro_specificity": 0.9691815961629444, "eval_precision": 0.5321554731456403, "eval_precision_macro": 0.2887439395071009, "eval_recall": 0.611154144074361, "eval_recall_macro": 0.302378554842108, "eval_runtime": 45.1674, "eval_samples_per_second": 28.583, "eval_steps_per_second": 3.587, "eval_weighted_fpr": 0.04347073086248701, "eval_weighted_sensitivity": 0.611154144074361, "eval_weighted_specificity": 0.9265697983698051, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.6994577846630519, "eval_f1_macro": 0.3947617401663212, "eval_f1_micro": 0.6994577846630519, "eval_f1_weighted": 0.6807748226338182, "eval_loss": 0.887535810470581, "eval_macro_fpr": 0.03062685085400977, "eval_macro_sensitivity": 0.4253981018601158, "eval_macro_specificity": 0.977359054380045, "eval_precision": 0.6728416067370143, "eval_precision_macro": 0.3822291983692299, "eval_recall": 0.6994577846630519, "eval_recall_macro": 0.4253981018601158, "eval_runtime": 44.0045, "eval_samples_per_second": 29.338, "eval_steps_per_second": 3.681, "eval_weighted_fpr": 0.02977743668457406, "eval_weighted_sensitivity": 0.6994577846630519, "eval_weighted_specificity": 0.9609280310376243, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.7064291247095275, "eval_f1_macro": 0.39687975393644837, "eval_f1_micro": 0.7064291247095275, "eval_f1_weighted": 0.6751887743731854, "eval_loss": 0.842707633972168, "eval_macro_fpr": 0.029525759570689643, "eval_macro_sensitivity": 0.44418263304043937, "eval_macro_specificity": 0.9780349023882488, "eval_precision": 0.6951917464608133, "eval_precision_macro": 0.4131313886422618, "eval_recall": 0.7064291247095275, "eval_recall_macro": 0.44418263304043937, "eval_runtime": 44.2756, "eval_samples_per_second": 29.158, "eval_steps_per_second": 3.659, "eval_weighted_fpr": 0.02882786947592607, "eval_weighted_sensitivity": 0.7064291247095275, "eval_weighted_specificity": 0.9640944111142056, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.958333333333333e-05, "loss": 1.2895, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7273431448489543, "eval_f1_macro": 0.42839565617146974, "eval_f1_micro": 0.7273431448489543, "eval_f1_weighted": 0.7166656051521775, "eval_loss": 0.7718679904937744, "eval_macro_fpr": 0.026373610346420835, "eval_macro_sensitivity": 0.4597947061276887, "eval_macro_specificity": 0.9797578098165848, "eval_precision": 0.7132141916978711, "eval_precision_macro": 0.41981312370683244, "eval_recall": 0.7273431448489543, "eval_recall_macro": 0.4597947061276887, "eval_runtime": 44.0471, "eval_samples_per_second": 29.31, "eval_steps_per_second": 3.678, "eval_weighted_fpr": 0.026077937472218107, "eval_weighted_sensitivity": 0.7273431448489543, "eval_weighted_specificity": 0.9690240023998159, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.750580945003873, "eval_f1_macro": 0.5071625387211971, "eval_f1_micro": 0.750580945003873, "eval_f1_weighted": 0.7368350875727435, "eval_loss": 0.7387559413909912, "eval_macro_fpr": 0.02390193870216418, "eval_macro_sensitivity": 0.5165232292614671, "eval_macro_specificity": 0.9813510652812688, "eval_precision": 0.739991301984922, "eval_precision_macro": 0.5733174750951799, "eval_recall": 0.750580945003873, "eval_recall_macro": 0.5165232292614671, "eval_runtime": 43.5191, "eval_samples_per_second": 29.665, "eval_steps_per_second": 3.723, "eval_weighted_fpr": 0.023185483870967742, "eval_weighted_sensitivity": 0.750580945003873, "eval_weighted_specificity": 0.9696850342151593, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.7443841982958946, "eval_f1_macro": 0.508766573370445, "eval_f1_micro": 0.7443841982958946, "eval_f1_weighted": 0.726841801268282, "eval_loss": 0.7526118755340576, "eval_macro_fpr": 0.024741953499129225, "eval_macro_sensitivity": 0.5229557335240369, "eval_macro_specificity": 0.980899976318631, "eval_precision": 0.7337183019873953, "eval_precision_macro": 0.5703412270657953, "eval_recall": 0.7443841982958946, "eval_recall_macro": 0.5229557335240369, "eval_runtime": 43.7116, "eval_samples_per_second": 29.534, "eval_steps_per_second": 3.706, "eval_weighted_fpr": 0.023940800928612886, "eval_weighted_sensitivity": 0.7443841982958946, "eval_weighted_specificity": 0.9691154464835722, "step": 964 }, { "epoch": 6.22, "learning_rate": 2.916666666666667e-05, "loss": 0.7332, "step": 1000 }, { "epoch": 7.0, "eval_accuracy": 0.7552285050348567, "eval_f1_macro": 0.5608894910772386, "eval_f1_micro": 0.7552285050348567, "eval_f1_weighted": 0.7460771491633669, "eval_loss": 0.7082085609436035, "eval_macro_fpr": 0.02329269548734161, "eval_macro_sensitivity": 0.5727565701904757, "eval_macro_specificity": 0.9817624646436656, "eval_precision": 0.7436383222975608, "eval_precision_macro": 0.5665418243254761, "eval_recall": 0.7552285050348567, "eval_recall_macro": 0.5727565701904757, "eval_runtime": 43.8592, "eval_samples_per_second": 29.435, "eval_steps_per_second": 3.694, "eval_weighted_fpr": 0.02262637834741515, "eval_weighted_sensitivity": 0.7552285050348567, "eval_weighted_specificity": 0.9712084646201266, "step": 1125 }, { "epoch": 8.0, "eval_accuracy": 0.7583268783888458, "eval_f1_macro": 0.5755845408528306, "eval_f1_micro": 0.7583268783888458, "eval_f1_weighted": 0.7502605827076951, "eval_loss": 0.7160602807998657, "eval_macro_fpr": 0.022834923601538912, "eval_macro_sensitivity": 0.5974764193374731, "eval_macro_specificity": 0.9820281006961107, "eval_precision": 0.7489019370925815, "eval_precision_macro": 0.5641453776326693, "eval_recall": 0.7583268783888458, "eval_recall_macro": 0.5974764193374731, "eval_runtime": 47.4544, "eval_samples_per_second": 27.205, "eval_steps_per_second": 3.414, "eval_weighted_fpr": 0.022257098016835498, "eval_weighted_sensitivity": 0.7583268783888458, "eval_weighted_specificity": 0.9720946320528147, "step": 1286 }, { "epoch": 9.0, "eval_accuracy": 0.7776917118512781, "eval_f1_macro": 0.5874833340927881, "eval_f1_micro": 0.7776917118512781, "eval_f1_weighted": 0.7653015782806978, "eval_loss": 0.683149516582489, "eval_macro_fpr": 0.020831516213897273, "eval_macro_sensitivity": 0.606896137249408, "eval_macro_specificity": 0.9832816294136357, "eval_precision": 0.7586915140412427, "eval_precision_macro": 0.5780981033617572, "eval_recall": 0.7776917118512781, "eval_recall_macro": 0.606896137249408, "eval_runtime": 50.31, "eval_samples_per_second": 25.661, "eval_steps_per_second": 3.22, "eval_weighted_fpr": 0.02000976085895559, "eval_weighted_sensitivity": 0.7776917118512781, "eval_weighted_specificity": 0.9715327293532582, "step": 1446 }, { "epoch": 9.33, "learning_rate": 1.8750000000000002e-05, "loss": 0.6167, "step": 1500 }, { "epoch": 10.0, "eval_accuracy": 0.7862122385747483, "eval_f1_macro": 0.5987413950993845, "eval_f1_micro": 0.7862122385747482, "eval_f1_weighted": 0.7753590541094936, "eval_loss": 0.6683156490325928, "eval_macro_fpr": 0.019819293314469463, "eval_macro_sensitivity": 0.617364154098103, "eval_macro_specificity": 0.9839313497952282, "eval_precision": 0.7714272913975577, "eval_precision_macro": 0.5916700769971839, "eval_recall": 0.7862122385747483, "eval_recall_macro": 0.617364154098103, "eval_runtime": 46.3094, "eval_samples_per_second": 27.878, "eval_steps_per_second": 3.498, "eval_weighted_fpr": 0.019052878641446915, "eval_weighted_sensitivity": 0.7862122385747483, "eval_weighted_specificity": 0.972758008353676, "step": 1607 }, { "epoch": 11.0, "eval_accuracy": 0.7761425251742835, "eval_f1_macro": 0.5945805235654043, "eval_f1_micro": 0.7761425251742835, "eval_f1_weighted": 0.7642426809512617, "eval_loss": 0.6884666085243225, "eval_macro_fpr": 0.020959556505082782, "eval_macro_sensitivity": 0.6219516621776988, "eval_macro_specificity": 0.9832325403042509, "eval_precision": 0.762752032263232, "eval_precision_macro": 0.581742682634886, "eval_recall": 0.7761425251742835, "eval_recall_macro": 0.6219516621776988, "eval_runtime": 44.4944, "eval_samples_per_second": 29.015, "eval_steps_per_second": 3.641, "eval_weighted_fpr": 0.02018579311308235, "eval_weighted_sensitivity": 0.7761425251742835, "eval_weighted_specificity": 0.9723455793894815, "step": 1768 }, { "epoch": 12.0, "eval_accuracy": 0.7869868319132456, "eval_f1_macro": 0.6214234200731922, "eval_f1_micro": 0.7869868319132455, "eval_f1_weighted": 0.7764436224395941, "eval_loss": 0.6829659938812256, "eval_macro_fpr": 0.01971781574074696, "eval_macro_sensitivity": 0.6463770170214457, "eval_macro_specificity": 0.9840270123264785, "eval_precision": 0.7826408792667282, "eval_precision_macro": 0.6626773170335125, "eval_recall": 0.7869868319132456, "eval_recall_macro": 0.6463770170214457, "eval_runtime": 43.9944, "eval_samples_per_second": 29.345, "eval_steps_per_second": 3.682, "eval_weighted_fpr": 0.018966825298296436, "eval_weighted_sensitivity": 0.7869868319132456, "eval_weighted_specificity": 0.9734183529839338, "step": 1929 }, { "epoch": 12.44, "learning_rate": 8.333333333333334e-06, "loss": 0.5314, "step": 2000 }, { "epoch": 13.0, "eval_accuracy": 0.7916343919442292, "eval_f1_macro": 0.6110606025775643, "eval_f1_micro": 0.7916343919442292, "eval_f1_weighted": 0.7817623460591858, "eval_loss": 0.660524845123291, "eval_macro_fpr": 0.01915789146680066, "eval_macro_sensitivity": 0.6358134270226833, "eval_macro_specificity": 0.984380207900859, "eval_precision": 0.7769679723590022, "eval_precision_macro": 0.5964718375735727, "eval_recall": 0.7916343919442292, "eval_recall_macro": 0.6358134270226833, "eval_runtime": 44.1283, "eval_samples_per_second": 29.256, "eval_steps_per_second": 3.671, "eval_weighted_fpr": 0.01845372847636688, "eval_weighted_sensitivity": 0.7916343919442292, "eval_weighted_specificity": 0.9740687265686558, "step": 2089 }, { "epoch": 14.0, "eval_accuracy": 0.790859798605732, "eval_f1_macro": 0.6261172643852387, "eval_f1_micro": 0.790859798605732, "eval_f1_weighted": 0.780302820536599, "eval_loss": 0.6614473462104797, "eval_macro_fpr": 0.019344545099537428, "eval_macro_sensitivity": 0.6477733385910524, "eval_macro_specificity": 0.9842490309995476, "eval_precision": 0.7794397894982683, "eval_precision_macro": 0.6367821774875876, "eval_recall": 0.790859798605732, "eval_recall_macro": 0.6477733385910524, "eval_runtime": 52.6504, "eval_samples_per_second": 24.52, "eval_steps_per_second": 3.077, "eval_weighted_fpr": 0.018538862949739082, "eval_weighted_sensitivity": 0.790859798605732, "eval_weighted_specificity": 0.9728756663874838, "step": 2250 } ], "logging_steps": 500, "max_steps": 2400, "num_train_epochs": 15, "save_steps": 500, "total_flos": 2.278788590234419e+16, "trial_name": null, "trial_params": null }