{ "best_metric": 0.5316254099721903, "best_model_checkpoint": "InLegalBERT-lora/checkpoint-964", "epoch": 5.996889580093312, "eval_steps": 500, "global_step": 964, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6553059643687065, "eval_f1_macro": 0.34196434919671853, "eval_f1_micro": 0.6553059643687065, "eval_f1_weighted": 0.6146575775654787, "eval_loss": 1.2012524604797363, "eval_macro_fpr": 0.036531607457408626, "eval_macro_sensitivity": 0.39029268516816945, "eval_macro_specificity": 0.9740627875145957, "eval_precision": 0.6007307052856502, "eval_precision_macro": 0.32788772117271575, "eval_recall": 0.6553059643687065, "eval_recall_macro": 0.39029268516816945, "eval_runtime": 30.3344, "eval_samples_per_second": 42.559, "eval_steps_per_second": 5.34, "eval_weighted_fpr": 0.03621124582960371, "eval_weighted_sensitivity": 0.6553059643687065, "eval_weighted_specificity": 0.9556358483502301, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.7381874515879163, "eval_f1_macro": 0.4250111578260666, "eval_f1_micro": 0.7381874515879164, "eval_f1_weighted": 0.7236865886821344, "eval_loss": 0.8278939127922058, "eval_macro_fpr": 0.024763530819684316, "eval_macro_sensitivity": 0.46578072689552413, "eval_macro_specificity": 0.9806295017830671, "eval_precision": 0.7211273477007717, "eval_precision_macro": 0.40923635739063985, "eval_recall": 0.7381874515879163, "eval_recall_macro": 0.46578072689552413, "eval_runtime": 34.091, "eval_samples_per_second": 37.869, "eval_steps_per_second": 4.752, "eval_weighted_fpr": 0.024707602339181286, "eval_weighted_sensitivity": 0.7381874515879163, "eval_weighted_specificity": 0.9712550751580882, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.7544539116963594, "eval_f1_macro": 0.44305220236653187, "eval_f1_micro": 0.7544539116963594, "eval_f1_weighted": 0.7304902543811719, "eval_loss": 0.713018000125885, "eval_macro_fpr": 0.0233195243156939, "eval_macro_sensitivity": 0.4769897256873969, "eval_macro_specificity": 0.9816367201302573, "eval_precision": 0.7255238407846915, "eval_precision_macro": 0.4800443784048848, "eval_recall": 0.7544539116963594, "eval_recall_macro": 0.4769897256873969, "eval_runtime": 32.6151, "eval_samples_per_second": 39.583, "eval_steps_per_second": 4.967, "eval_weighted_fpr": 0.02271912850283093, "eval_weighted_sensitivity": 0.7544539116963594, "eval_weighted_specificity": 0.9700968902575, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.958333333333333e-05, "loss": 1.1985, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7823392718822618, "eval_f1_macro": 0.5047859025633034, "eval_f1_micro": 0.7823392718822618, "eval_f1_weighted": 0.766027283346833, "eval_loss": 0.6922410726547241, "eval_macro_fpr": 0.02001637486004151, "eval_macro_sensitivity": 0.528327896933921, "eval_macro_specificity": 0.9837585704961105, "eval_precision": 0.7594430092765442, "eval_precision_macro": 0.5188076394331661, "eval_recall": 0.7823392718822618, "eval_recall_macro": 0.528327896933921, "eval_runtime": 32.5532, "eval_samples_per_second": 39.658, "eval_steps_per_second": 4.976, "eval_weighted_fpr": 0.019485472574717427, "eval_weighted_sensitivity": 0.7823392718822618, "eval_weighted_specificity": 0.9740392855593933, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.7939581719597212, "eval_f1_macro": 0.5257108179174788, "eval_f1_micro": 0.7939581719597211, "eval_f1_weighted": 0.7717932414170925, "eval_loss": 0.6710420846939087, "eval_macro_fpr": 0.018964580711785816, "eval_macro_sensitivity": 0.5571328425020213, "eval_macro_specificity": 0.9845265708178329, "eval_precision": 0.7734327517428056, "eval_precision_macro": 0.5449998556573111, "eval_recall": 0.7939581719597212, "eval_recall_macro": 0.5571328425020213, "eval_runtime": 33.235, "eval_samples_per_second": 38.845, "eval_steps_per_second": 4.874, "eval_weighted_fpr": 0.018199233716475097, "eval_weighted_sensitivity": 0.7939581719597212, "eval_weighted_specificity": 0.9739403903077732, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.7970565453137103, "eval_f1_macro": 0.5316254099721903, "eval_f1_micro": 0.7970565453137104, "eval_f1_weighted": 0.7789523196246046, "eval_loss": 0.6454855799674988, "eval_macro_fpr": 0.018368947118040532, "eval_macro_sensitivity": 0.5622105847462606, "eval_macro_specificity": 0.9848273693754934, "eval_precision": 0.7756987894676903, "eval_precision_macro": 0.5353415355904975, "eval_recall": 0.7970565453137103, "eval_recall_macro": 0.5622105847462606, "eval_runtime": 33.0425, "eval_samples_per_second": 39.071, "eval_steps_per_second": 4.903, "eval_weighted_fpr": 0.017862012544314153, "eval_weighted_sensitivity": 0.7970565453137103, "eval_weighted_specificity": 0.9753539953186898, "step": 964 } ], "logging_steps": 500, "max_steps": 2400, "num_train_epochs": 15, "save_steps": 500, "total_flos": 8366917304180736.0, "trial_name": null, "trial_params": null }