{ "best_metric": 0.6372154277689757, "best_model_checkpoint": "InLegalBERT-lora/checkpoint-1929", "epoch": 12.0, "eval_steps": 500, "global_step": 1929, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6553059643687065, "eval_f1_macro": 0.34196434919671853, "eval_f1_micro": 0.6553059643687065, "eval_f1_weighted": 0.6146575775654787, "eval_loss": 1.2012524604797363, "eval_macro_fpr": 0.036531607457408626, "eval_macro_sensitivity": 0.39029268516816945, "eval_macro_specificity": 0.9740627875145957, "eval_precision": 0.6007307052856502, "eval_precision_macro": 0.32788772117271575, "eval_recall": 0.6553059643687065, "eval_recall_macro": 0.39029268516816945, "eval_runtime": 30.3344, "eval_samples_per_second": 42.559, "eval_steps_per_second": 5.34, "eval_weighted_fpr": 0.03621124582960371, "eval_weighted_sensitivity": 0.6553059643687065, "eval_weighted_specificity": 0.9556358483502301, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.7381874515879163, "eval_f1_macro": 0.4250111578260666, "eval_f1_micro": 0.7381874515879164, "eval_f1_weighted": 0.7236865886821344, "eval_loss": 0.8278939127922058, "eval_macro_fpr": 0.024763530819684316, "eval_macro_sensitivity": 0.46578072689552413, "eval_macro_specificity": 0.9806295017830671, "eval_precision": 0.7211273477007717, "eval_precision_macro": 0.40923635739063985, "eval_recall": 0.7381874515879163, "eval_recall_macro": 0.46578072689552413, "eval_runtime": 34.091, "eval_samples_per_second": 37.869, "eval_steps_per_second": 4.752, "eval_weighted_fpr": 0.024707602339181286, "eval_weighted_sensitivity": 0.7381874515879163, "eval_weighted_specificity": 0.9712550751580882, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.7544539116963594, "eval_f1_macro": 0.44305220236653187, "eval_f1_micro": 0.7544539116963594, "eval_f1_weighted": 0.7304902543811719, "eval_loss": 0.713018000125885, "eval_macro_fpr": 0.0233195243156939, "eval_macro_sensitivity": 0.4769897256873969, "eval_macro_specificity": 0.9816367201302573, "eval_precision": 0.7255238407846915, "eval_precision_macro": 0.4800443784048848, "eval_recall": 0.7544539116963594, "eval_recall_macro": 0.4769897256873969, "eval_runtime": 32.6151, "eval_samples_per_second": 39.583, "eval_steps_per_second": 4.967, "eval_weighted_fpr": 0.02271912850283093, "eval_weighted_sensitivity": 0.7544539116963594, "eval_weighted_specificity": 0.9700968902575, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.958333333333333e-05, "loss": 1.1985, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7823392718822618, "eval_f1_macro": 0.5047859025633034, "eval_f1_micro": 0.7823392718822618, "eval_f1_weighted": 0.766027283346833, "eval_loss": 0.6922410726547241, "eval_macro_fpr": 0.02001637486004151, "eval_macro_sensitivity": 0.528327896933921, "eval_macro_specificity": 0.9837585704961105, "eval_precision": 0.7594430092765442, "eval_precision_macro": 0.5188076394331661, "eval_recall": 0.7823392718822618, "eval_recall_macro": 0.528327896933921, "eval_runtime": 32.5532, "eval_samples_per_second": 39.658, "eval_steps_per_second": 4.976, "eval_weighted_fpr": 0.019485472574717427, "eval_weighted_sensitivity": 0.7823392718822618, "eval_weighted_specificity": 0.9740392855593933, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.7939581719597212, "eval_f1_macro": 0.5257108179174788, "eval_f1_micro": 0.7939581719597211, "eval_f1_weighted": 0.7717932414170925, "eval_loss": 0.6710420846939087, "eval_macro_fpr": 0.018964580711785816, "eval_macro_sensitivity": 0.5571328425020213, "eval_macro_specificity": 0.9845265708178329, "eval_precision": 0.7734327517428056, "eval_precision_macro": 0.5449998556573111, "eval_recall": 0.7939581719597212, "eval_recall_macro": 0.5571328425020213, "eval_runtime": 33.235, "eval_samples_per_second": 38.845, "eval_steps_per_second": 4.874, "eval_weighted_fpr": 0.018199233716475097, "eval_weighted_sensitivity": 0.7939581719597212, "eval_weighted_specificity": 0.9739403903077732, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.7970565453137103, "eval_f1_macro": 0.5316254099721903, "eval_f1_micro": 0.7970565453137104, "eval_f1_weighted": 0.7789523196246046, "eval_loss": 0.6454855799674988, "eval_macro_fpr": 0.018368947118040532, "eval_macro_sensitivity": 0.5622105847462606, "eval_macro_specificity": 0.9848273693754934, "eval_precision": 0.7756987894676903, "eval_precision_macro": 0.5353415355904975, "eval_recall": 0.7970565453137103, "eval_recall_macro": 0.5622105847462606, "eval_runtime": 33.0425, "eval_samples_per_second": 39.071, "eval_steps_per_second": 4.903, "eval_weighted_fpr": 0.017862012544314153, "eval_weighted_sensitivity": 0.7970565453137103, "eval_weighted_specificity": 0.9753539953186898, "step": 964 }, { "epoch": 6.22, "learning_rate": 2.916666666666667e-05, "loss": 0.5721, "step": 1000 }, { "epoch": 7.0, "eval_accuracy": 0.8001549186676995, "eval_f1_macro": 0.5486067787470349, "eval_f1_micro": 0.8001549186676995, "eval_f1_weighted": 0.7845126172395842, "eval_loss": 0.6394562721252441, "eval_macro_fpr": 0.01807650265580631, "eval_macro_sensitivity": 0.5784319115133939, "eval_macro_specificity": 0.9850891561725063, "eval_precision": 0.7801018097427485, "eval_precision_macro": 0.5442815357986059, "eval_recall": 0.8001549186676995, "eval_recall_macro": 0.5784319115133939, "eval_runtime": 32.9727, "eval_samples_per_second": 39.154, "eval_steps_per_second": 4.913, "eval_weighted_fpr": 0.017527173913043478, "eval_weighted_sensitivity": 0.8001549186676995, "eval_weighted_specificity": 0.9761824239198935, "step": 1125 }, { "epoch": 8.0, "eval_accuracy": 0.8024786986831913, "eval_f1_macro": 0.5474570084709011, "eval_f1_micro": 0.8024786986831914, "eval_f1_weighted": 0.787386582262622, "eval_loss": 0.6317066550254822, "eval_macro_fpr": 0.017822080148589308, "eval_macro_sensitivity": 0.5773035410379497, "eval_macro_specificity": 0.9852623885220758, "eval_precision": 0.783268466071204, "eval_precision_macro": 0.5438628735250125, "eval_recall": 0.8024786986831913, "eval_recall_macro": 0.5773035410379497, "eval_runtime": 33.0187, "eval_samples_per_second": 39.099, "eval_steps_per_second": 4.906, "eval_weighted_fpr": 0.017277593332881633, "eval_weighted_sensitivity": 0.8024786986831913, "eval_weighted_specificity": 0.9764571291479465, "step": 1286 }, { "epoch": 9.0, "eval_accuracy": 0.8009295120061968, "eval_f1_macro": 0.5609368334662593, "eval_f1_micro": 0.8009295120061968, "eval_f1_weighted": 0.7875081013739925, "eval_loss": 0.6136514544487, "eval_macro_fpr": 0.017931645431496272, "eval_macro_sensitivity": 0.5841960959288544, "eval_macro_specificity": 0.985161694874728, "eval_precision": 0.7827917488346946, "eval_precision_macro": 0.5593054718395108, "eval_recall": 0.8009295120061968, "eval_recall_macro": 0.5841960959288544, "eval_runtime": 33.7216, "eval_samples_per_second": 38.284, "eval_steps_per_second": 4.804, "eval_weighted_fpr": 0.017443833570895267, "eval_weighted_sensitivity": 0.8009295120061968, "eval_weighted_specificity": 0.9764959111147221, "step": 1446 }, { "epoch": 9.33, "learning_rate": 1.8750000000000002e-05, "loss": 0.4166, "step": 1500 }, { "epoch": 10.0, "eval_accuracy": 0.8156467854376452, "eval_f1_macro": 0.6305053806449583, "eval_f1_micro": 0.8156467854376452, "eval_f1_weighted": 0.8066651282863864, "eval_loss": 0.6248635649681091, "eval_macro_fpr": 0.016463869736407642, "eval_macro_sensitivity": 0.6430050326236179, "eval_macro_specificity": 0.9861908495694477, "eval_precision": 0.8054630087428596, "eval_precision_macro": 0.639776904615918, "eval_recall": 0.8156467854376452, "eval_recall_macro": 0.6430050326236179, "eval_runtime": 33.5965, "eval_samples_per_second": 38.427, "eval_steps_per_second": 4.822, "eval_weighted_fpr": 0.01588785046728972, "eval_weighted_sensitivity": 0.8156467854376452, "eval_weighted_specificity": 0.9772159581040682, "step": 1607 }, { "epoch": 11.0, "eval_accuracy": 0.8125484120836561, "eval_f1_macro": 0.6371983241862614, "eval_f1_micro": 0.8125484120836561, "eval_f1_weighted": 0.8042305582147614, "eval_loss": 0.642641544342041, "eval_macro_fpr": 0.016876700974845713, "eval_macro_sensitivity": 0.6520338532213917, "eval_macro_specificity": 0.9859193883690203, "eval_precision": 0.8013591068710365, "eval_precision_macro": 0.6397179331634546, "eval_recall": 0.8125484120836561, "eval_recall_macro": 0.6520338532213917, "eval_runtime": 33.85, "eval_samples_per_second": 38.139, "eval_steps_per_second": 4.786, "eval_weighted_fpr": 0.016211146838156484, "eval_weighted_sensitivity": 0.8125484120836561, "eval_weighted_specificity": 0.9762424134516496, "step": 1768 }, { "epoch": 12.0, "eval_accuracy": 0.8164213787761425, "eval_f1_macro": 0.6372154277689757, "eval_f1_micro": 0.8164213787761425, "eval_f1_weighted": 0.8082672837501724, "eval_loss": 0.6305465698242188, "eval_macro_fpr": 0.016428781045237314, "eval_macro_sensitivity": 0.6526108250586471, "eval_macro_specificity": 0.9862261630603141, "eval_precision": 0.8050297561179627, "eval_precision_macro": 0.635785837139922, "eval_recall": 0.8164213787761425, "eval_recall_macro": 0.6526108250586471, "eval_runtime": 33.9194, "eval_samples_per_second": 38.061, "eval_steps_per_second": 4.776, "eval_weighted_fpr": 0.01580737677582872, "eval_weighted_sensitivity": 0.8164213787761425, "eval_weighted_specificity": 0.9769710671285662, "step": 1929 } ], "logging_steps": 500, "max_steps": 2400, "num_train_epochs": 15, "save_steps": 500, "total_flos": 1.6733834608361472e+16, "trial_name": null, "trial_params": null }