File size: 5,781 Bytes
b61d552
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
{
  "best_metric": 0.5316254099721903,
  "best_model_checkpoint": "InLegalBERT-lora/checkpoint-964",
  "epoch": 5.996889580093312,
  "eval_steps": 500,
  "global_step": 964,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_accuracy": 0.6553059643687065,
      "eval_f1_macro": 0.34196434919671853,
      "eval_f1_micro": 0.6553059643687065,
      "eval_f1_weighted": 0.6146575775654787,
      "eval_loss": 1.2012524604797363,
      "eval_macro_fpr": 0.036531607457408626,
      "eval_macro_sensitivity": 0.39029268516816945,
      "eval_macro_specificity": 0.9740627875145957,
      "eval_precision": 0.6007307052856502,
      "eval_precision_macro": 0.32788772117271575,
      "eval_recall": 0.6553059643687065,
      "eval_recall_macro": 0.39029268516816945,
      "eval_runtime": 30.3344,
      "eval_samples_per_second": 42.559,
      "eval_steps_per_second": 5.34,
      "eval_weighted_fpr": 0.03621124582960371,
      "eval_weighted_sensitivity": 0.6553059643687065,
      "eval_weighted_specificity": 0.9556358483502301,
      "step": 160
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.7381874515879163,
      "eval_f1_macro": 0.4250111578260666,
      "eval_f1_micro": 0.7381874515879164,
      "eval_f1_weighted": 0.7236865886821344,
      "eval_loss": 0.8278939127922058,
      "eval_macro_fpr": 0.024763530819684316,
      "eval_macro_sensitivity": 0.46578072689552413,
      "eval_macro_specificity": 0.9806295017830671,
      "eval_precision": 0.7211273477007717,
      "eval_precision_macro": 0.40923635739063985,
      "eval_recall": 0.7381874515879163,
      "eval_recall_macro": 0.46578072689552413,
      "eval_runtime": 34.091,
      "eval_samples_per_second": 37.869,
      "eval_steps_per_second": 4.752,
      "eval_weighted_fpr": 0.024707602339181286,
      "eval_weighted_sensitivity": 0.7381874515879163,
      "eval_weighted_specificity": 0.9712550751580882,
      "step": 321
    },
    {
      "epoch": 3.0,
      "eval_accuracy": 0.7544539116963594,
      "eval_f1_macro": 0.44305220236653187,
      "eval_f1_micro": 0.7544539116963594,
      "eval_f1_weighted": 0.7304902543811719,
      "eval_loss": 0.713018000125885,
      "eval_macro_fpr": 0.0233195243156939,
      "eval_macro_sensitivity": 0.4769897256873969,
      "eval_macro_specificity": 0.9816367201302573,
      "eval_precision": 0.7255238407846915,
      "eval_precision_macro": 0.4800443784048848,
      "eval_recall": 0.7544539116963594,
      "eval_recall_macro": 0.4769897256873969,
      "eval_runtime": 32.6151,
      "eval_samples_per_second": 39.583,
      "eval_steps_per_second": 4.967,
      "eval_weighted_fpr": 0.02271912850283093,
      "eval_weighted_sensitivity": 0.7544539116963594,
      "eval_weighted_specificity": 0.9700968902575,
      "step": 482
    },
    {
      "epoch": 3.11,
      "learning_rate": 3.958333333333333e-05,
      "loss": 1.1985,
      "step": 500
    },
    {
      "epoch": 4.0,
      "eval_accuracy": 0.7823392718822618,
      "eval_f1_macro": 0.5047859025633034,
      "eval_f1_micro": 0.7823392718822618,
      "eval_f1_weighted": 0.766027283346833,
      "eval_loss": 0.6922410726547241,
      "eval_macro_fpr": 0.02001637486004151,
      "eval_macro_sensitivity": 0.528327896933921,
      "eval_macro_specificity": 0.9837585704961105,
      "eval_precision": 0.7594430092765442,
      "eval_precision_macro": 0.5188076394331661,
      "eval_recall": 0.7823392718822618,
      "eval_recall_macro": 0.528327896933921,
      "eval_runtime": 32.5532,
      "eval_samples_per_second": 39.658,
      "eval_steps_per_second": 4.976,
      "eval_weighted_fpr": 0.019485472574717427,
      "eval_weighted_sensitivity": 0.7823392718822618,
      "eval_weighted_specificity": 0.9740392855593933,
      "step": 643
    },
    {
      "epoch": 5.0,
      "eval_accuracy": 0.7939581719597212,
      "eval_f1_macro": 0.5257108179174788,
      "eval_f1_micro": 0.7939581719597211,
      "eval_f1_weighted": 0.7717932414170925,
      "eval_loss": 0.6710420846939087,
      "eval_macro_fpr": 0.018964580711785816,
      "eval_macro_sensitivity": 0.5571328425020213,
      "eval_macro_specificity": 0.9845265708178329,
      "eval_precision": 0.7734327517428056,
      "eval_precision_macro": 0.5449998556573111,
      "eval_recall": 0.7939581719597212,
      "eval_recall_macro": 0.5571328425020213,
      "eval_runtime": 33.235,
      "eval_samples_per_second": 38.845,
      "eval_steps_per_second": 4.874,
      "eval_weighted_fpr": 0.018199233716475097,
      "eval_weighted_sensitivity": 0.7939581719597212,
      "eval_weighted_specificity": 0.9739403903077732,
      "step": 803
    },
    {
      "epoch": 6.0,
      "eval_accuracy": 0.7970565453137103,
      "eval_f1_macro": 0.5316254099721903,
      "eval_f1_micro": 0.7970565453137104,
      "eval_f1_weighted": 0.7789523196246046,
      "eval_loss": 0.6454855799674988,
      "eval_macro_fpr": 0.018368947118040532,
      "eval_macro_sensitivity": 0.5622105847462606,
      "eval_macro_specificity": 0.9848273693754934,
      "eval_precision": 0.7756987894676903,
      "eval_precision_macro": 0.5353415355904975,
      "eval_recall": 0.7970565453137103,
      "eval_recall_macro": 0.5622105847462606,
      "eval_runtime": 33.0425,
      "eval_samples_per_second": 39.071,
      "eval_steps_per_second": 4.903,
      "eval_weighted_fpr": 0.017862012544314153,
      "eval_weighted_sensitivity": 0.7970565453137103,
      "eval_weighted_specificity": 0.9753539953186898,
      "step": 964
    }
  ],
  "logging_steps": 500,
  "max_steps": 2400,
  "num_train_epochs": 15,
  "save_steps": 500,
  "total_flos": 8366917304180736.0,
  "trial_name": null,
  "trial_params": null
}