xshubhamx committed on
Commit
94e184b
·
verified ·
1 Parent(s): 50a2d98

Upload folder using huggingface_hub

Browse files
training_checkpoints/checkpoint-1125/adapter_config.json CHANGED
@@ -21,8 +21,8 @@
21
  "revision": null,
22
  "target_modules": [
23
  "key",
24
- "dense",
25
  "value",
 
26
  "query"
27
  ],
28
  "task_type": "SEQ_CLS",
 
21
  "revision": null,
22
  "target_modules": [
23
  "key",
 
24
  "value",
25
+ "dense",
26
  "query"
27
  ],
28
  "task_type": "SEQ_CLS",
training_checkpoints/checkpoint-1125/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:751c058d328d5bced7fcc3d8c590845b12aedffec849ef6e36b8f6b80509dc4a
3
  size 104549068
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca6b02a5f83d3d6b2bbc636ee862fc1d6896a112b391969b1379ff2a2cc6774f
3
  size 104549068
training_checkpoints/checkpoint-1125/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51a34afa9448b5e619706a6ed419f14e3795ce9f674a26cbaa0a541d5dedec9c
3
  size 21646778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a285e2020d2e294d6d26b5d7bc54971b751e4a19b4dfb1e292413766f04ab231
3
  size 21646778
training_checkpoints/checkpoint-1125/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20a6fea19f4fba60504f25e5a88ef9ff2e0562d058598a10a7b8423ea5b6c595
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40224493aacf0cd0f7038028ae3514743b7f864ad570d1dd323ebd02caa1c08b
3
  size 1064
training_checkpoints/checkpoint-1125/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.4555893583613109,
3
  "best_model_checkpoint": "legal-bert-lora/checkpoint-1125",
4
  "epoch": 6.998444790046657,
5
  "eval_steps": 500,
@@ -10,174 +10,174 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6297443841982959,
14
- "eval_f1_macro": 0.274206359888179,
15
- "eval_f1_micro": 0.6297443841982959,
16
- "eval_f1_weighted": 0.5693924444438366,
17
- "eval_loss": 1.3252344131469727,
18
- "eval_macro_fpr": 0.04170202326759921,
19
- "eval_macro_sensitivity": 0.31095312319919677,
20
- "eval_macro_specificity": 0.9716859606487191,
21
- "eval_precision": 0.5643117258906628,
22
- "eval_precision_macro": 0.2864620870649182,
23
- "eval_recall": 0.6297443841982959,
24
- "eval_recall_macro": 0.31095312319919677,
25
- "eval_runtime": 29.2455,
26
- "eval_samples_per_second": 44.143,
27
- "eval_steps_per_second": 5.539,
28
- "eval_weighted_fpr": 0.0403035413153457,
29
- "eval_weighted_sensitivity": 0.6297443841982959,
30
- "eval_weighted_specificity": 0.945545025532491,
31
  "step": 160
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.7312161115414407,
36
- "eval_f1_macro": 0.39668888106795264,
37
- "eval_f1_micro": 0.7312161115414407,
38
- "eval_f1_weighted": 0.6996238601563893,
39
- "eval_loss": 0.8870222568511963,
40
- "eval_macro_fpr": 0.025654492164758257,
41
- "eval_macro_sensitivity": 0.4525442260434048,
42
- "eval_macro_specificity": 0.9800113592544849,
43
- "eval_precision": 0.687310022738013,
44
- "eval_precision_macro": 0.37417463878901125,
45
- "eval_recall": 0.7312161115414407,
46
- "eval_recall_macro": 0.4525442260434048,
47
- "eval_runtime": 31.4769,
48
- "eval_samples_per_second": 41.014,
49
- "eval_steps_per_second": 5.147,
50
- "eval_weighted_fpr": 0.025584310255843103,
51
- "eval_weighted_sensitivity": 0.7312161115414407,
52
- "eval_weighted_specificity": 0.9689542772758329,
53
  "step": 321
54
  },
55
  {
56
  "epoch": 3.0,
57
- "eval_accuracy": 0.7482571649883811,
58
- "eval_f1_macro": 0.4262450946907797,
59
- "eval_f1_micro": 0.7482571649883811,
60
- "eval_f1_weighted": 0.7282078768513273,
61
- "eval_loss": 0.7794041037559509,
62
- "eval_macro_fpr": 0.023941075707085962,
63
- "eval_macro_sensitivity": 0.46803400264857875,
64
- "eval_macro_specificity": 0.9812882861560729,
65
- "eval_precision": 0.716881212213352,
66
- "eval_precision_macro": 0.40594566191566384,
67
- "eval_recall": 0.7482571649883811,
68
- "eval_recall_macro": 0.46803400264857875,
69
- "eval_runtime": 31.9176,
70
- "eval_samples_per_second": 40.448,
71
- "eval_steps_per_second": 5.076,
72
- "eval_weighted_fpr": 0.02346739836811322,
73
- "eval_weighted_sensitivity": 0.7482571649883811,
74
- "eval_weighted_specificity": 0.9710671273527125,
75
  "step": 482
76
  },
77
  {
78
  "epoch": 3.11,
79
- "learning_rate": 3.4375e-05,
80
- "loss": 1.2835,
81
  "step": 500
82
  },
83
  {
84
  "epoch": 4.0,
85
- "eval_accuracy": 0.7443841982958946,
86
- "eval_f1_macro": 0.4099967964216515,
87
- "eval_f1_micro": 0.7443841982958946,
88
- "eval_f1_weighted": 0.7145941103131069,
89
- "eval_loss": 0.7480739951133728,
90
- "eval_macro_fpr": 0.024347730036769315,
91
- "eval_macro_sensitivity": 0.45879715060247334,
92
- "eval_macro_specificity": 0.9809610383366641,
93
- "eval_precision": 0.7084810945380595,
94
- "eval_precision_macro": 0.39966194371515146,
95
- "eval_recall": 0.7443841982958946,
96
- "eval_recall_macro": 0.45879715060247334,
97
- "eval_runtime": 31.4007,
98
- "eval_samples_per_second": 41.114,
99
- "eval_steps_per_second": 5.159,
100
- "eval_weighted_fpr": 0.023940800928612886,
101
- "eval_weighted_sensitivity": 0.7443841982958946,
102
- "eval_weighted_specificity": 0.9700313767540658,
103
  "step": 643
104
  },
105
  {
106
  "epoch": 5.0,
107
- "eval_accuracy": 0.7629744384198296,
108
- "eval_f1_macro": 0.43501781058601113,
109
- "eval_f1_micro": 0.7629744384198296,
110
- "eval_f1_weighted": 0.7371758021368604,
111
- "eval_loss": 0.7360239624977112,
112
- "eval_macro_fpr": 0.022582062196490615,
113
- "eval_macro_sensitivity": 0.4763281068994499,
114
- "eval_macro_specificity": 0.9822126782492226,
115
- "eval_precision": 0.7245041319757508,
116
- "eval_precision_macro": 0.4175606064626592,
117
- "eval_recall": 0.7629744384198296,
118
- "eval_recall_macro": 0.4763281068994499,
119
- "eval_runtime": 31.4819,
120
- "eval_samples_per_second": 41.008,
121
- "eval_steps_per_second": 5.146,
122
- "eval_weighted_fpr": 0.021708286038592508,
123
- "eval_weighted_sensitivity": 0.7629744384198296,
124
- "eval_weighted_specificity": 0.9702157353185087,
125
  "step": 803
126
  },
127
  {
128
  "epoch": 6.0,
129
- "eval_accuracy": 0.7738187451587917,
130
- "eval_f1_macro": 0.45136434049983454,
131
- "eval_f1_micro": 0.7738187451587917,
132
- "eval_f1_weighted": 0.7549277434298373,
133
- "eval_loss": 0.7146413922309875,
134
- "eval_macro_fpr": 0.020909390992017808,
135
- "eval_macro_sensitivity": 0.49065578942391963,
136
- "eval_macro_specificity": 0.9831195609570588,
137
- "eval_precision": 0.7789833226684362,
138
- "eval_precision_macro": 0.5020078701673053,
139
- "eval_recall": 0.7738187451587917,
140
- "eval_recall_macro": 0.49065578942391963,
141
- "eval_runtime": 31.935,
142
- "eval_samples_per_second": 40.426,
143
- "eval_steps_per_second": 5.073,
144
- "eval_weighted_fpr": 0.020451043563524302,
145
- "eval_weighted_sensitivity": 0.7738187451587917,
146
- "eval_weighted_specificity": 0.9729746691970887,
147
  "step": 964
148
  },
149
  {
150
  "epoch": 6.22,
151
- "learning_rate": 1.8750000000000002e-05,
152
- "loss": 0.6494,
153
  "step": 1000
154
  },
155
  {
156
  "epoch": 7.0,
157
- "eval_accuracy": 0.7606506584043378,
158
- "eval_f1_macro": 0.4555893583613109,
159
- "eval_f1_micro": 0.7606506584043377,
160
- "eval_f1_weighted": 0.739017992628783,
161
- "eval_loss": 0.7362409234046936,
162
- "eval_macro_fpr": 0.022493653031422953,
163
- "eval_macro_sensitivity": 0.4889578896745981,
164
- "eval_macro_specificity": 0.9822020479931979,
165
- "eval_precision": 0.7519338544853175,
166
- "eval_precision_macro": 0.5232191620367644,
167
- "eval_recall": 0.7606506584043378,
168
- "eval_recall_macro": 0.4889578896745981,
169
- "eval_runtime": 31.5363,
170
- "eval_samples_per_second": 40.937,
171
- "eval_steps_per_second": 5.137,
172
- "eval_weighted_fpr": 0.021981930710677954,
173
- "eval_weighted_sensitivity": 0.7606506584043378,
174
- "eval_weighted_specificity": 0.9723800614936304,
175
  "step": 1125
176
  }
177
  ],
178
  "logging_steps": 500,
179
- "max_steps": 1600,
180
- "num_train_epochs": 10,
181
  "save_steps": 500,
182
  "total_flos": 9761403521544192.0,
183
  "trial_name": null,
 
1
  {
2
+ "best_metric": 0.6191969834738721,
3
  "best_model_checkpoint": "legal-bert-lora/checkpoint-1125",
4
  "epoch": 6.998444790046657,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6374903175832688,
14
+ "eval_f1_macro": 0.3394539856434376,
15
+ "eval_f1_micro": 0.6374903175832688,
16
+ "eval_f1_weighted": 0.5765523433851403,
17
+ "eval_loss": 1.3127473592758179,
18
+ "eval_macro_fpr": 0.040137717078130394,
19
+ "eval_macro_sensitivity": 0.4017115530536667,
20
+ "eval_macro_specificity": 0.9725650393599338,
21
+ "eval_precision": 0.5466227876047401,
22
+ "eval_precision_macro": 0.31141306924471374,
23
+ "eval_recall": 0.6374903175832688,
24
+ "eval_recall_macro": 0.4017115530536667,
25
+ "eval_runtime": 44.4128,
26
+ "eval_samples_per_second": 29.068,
27
+ "eval_steps_per_second": 3.648,
28
+ "eval_weighted_fpr": 0.0390325271059216,
29
+ "eval_weighted_sensitivity": 0.6374903175832688,
30
+ "eval_weighted_specificity": 0.950985272815738,
31
  "step": 160
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "eval_accuracy": 0.7273431448489543,
36
+ "eval_f1_macro": 0.3969800602789428,
37
+ "eval_f1_micro": 0.7273431448489543,
38
+ "eval_f1_weighted": 0.6960627383550935,
39
+ "eval_loss": 0.8160030841827393,
40
+ "eval_macro_fpr": 0.026417996388603746,
41
+ "eval_macro_sensitivity": 0.450135625445356,
42
+ "eval_macro_specificity": 0.9796396430402219,
43
+ "eval_precision": 0.6997929823446861,
44
+ "eval_precision_macro": 0.39453164470926966,
45
+ "eval_recall": 0.7273431448489543,
46
+ "eval_recall_macro": 0.450135625445356,
47
+ "eval_runtime": 34.3148,
48
+ "eval_samples_per_second": 37.622,
49
+ "eval_steps_per_second": 4.721,
50
+ "eval_weighted_fpr": 0.026077937472218107,
51
+ "eval_weighted_sensitivity": 0.7273431448489543,
52
+ "eval_weighted_specificity": 0.9672515007543734,
53
  "step": 321
54
  },
55
  {
56
  "epoch": 3.0,
57
+ "eval_accuracy": 0.7443841982958946,
58
+ "eval_f1_macro": 0.4210575074216338,
59
+ "eval_f1_micro": 0.7443841982958946,
60
+ "eval_f1_weighted": 0.7223603623418946,
61
+ "eval_loss": 0.7322217226028442,
62
+ "eval_macro_fpr": 0.024451015698283406,
63
+ "eval_macro_sensitivity": 0.46251578703813245,
64
+ "eval_macro_specificity": 0.9809603839363172,
65
+ "eval_precision": 0.711002444877192,
66
+ "eval_precision_macro": 0.4030436676815596,
67
+ "eval_recall": 0.7443841982958946,
68
+ "eval_recall_macro": 0.46251578703813245,
69
+ "eval_runtime": 32.8708,
70
+ "eval_samples_per_second": 39.275,
71
+ "eval_steps_per_second": 4.928,
72
+ "eval_weighted_fpr": 0.023940800928612886,
73
+ "eval_weighted_sensitivity": 0.7443841982958946,
74
+ "eval_weighted_specificity": 0.9700215607488639,
75
  "step": 482
76
  },
77
  {
78
  "epoch": 3.11,
79
+ "learning_rate": 3.958333333333333e-05,
80
+ "loss": 1.2229,
81
  "step": 500
82
  },
83
  {
84
  "epoch": 4.0,
85
+ "eval_accuracy": 0.7536793183578622,
86
+ "eval_f1_macro": 0.46141164864389705,
87
+ "eval_f1_micro": 0.7536793183578622,
88
+ "eval_f1_weighted": 0.7337325056665881,
89
+ "eval_loss": 0.7034952640533447,
90
+ "eval_macro_fpr": 0.023326126599014015,
91
+ "eval_macro_sensitivity": 0.4865735295815666,
92
+ "eval_macro_specificity": 0.9815978320880049,
93
+ "eval_precision": 0.7340611054176746,
94
+ "eval_precision_macro": 0.4982390488816621,
95
+ "eval_recall": 0.7536793183578622,
96
+ "eval_recall_macro": 0.4865735295815666,
97
+ "eval_runtime": 33.282,
98
+ "eval_samples_per_second": 38.79,
99
+ "eval_steps_per_second": 4.868,
100
+ "eval_weighted_fpr": 0.022812051649928264,
101
+ "eval_weighted_sensitivity": 0.7536793183578622,
102
+ "eval_weighted_specificity": 0.9702881629622103,
103
  "step": 643
104
  },
105
  {
106
  "epoch": 5.0,
107
+ "eval_accuracy": 0.7652982184353214,
108
+ "eval_f1_macro": 0.4824234674423381,
109
+ "eval_f1_micro": 0.7652982184353214,
110
+ "eval_f1_weighted": 0.7415202198150465,
111
+ "eval_loss": 0.6963701844215393,
112
+ "eval_macro_fpr": 0.022125198961045537,
113
+ "eval_macro_sensitivity": 0.5099998711032655,
114
+ "eval_macro_specificity": 0.982427621700107,
115
+ "eval_precision": 0.7403884847240659,
116
+ "eval_precision_macro": 0.5015009503316971,
117
+ "eval_recall": 0.7652982184353214,
118
+ "eval_recall_macro": 0.5099998711032655,
119
+ "eval_runtime": 29.8835,
120
+ "eval_samples_per_second": 43.201,
121
+ "eval_steps_per_second": 5.421,
122
+ "eval_weighted_fpr": 0.02143615139724089,
123
+ "eval_weighted_sensitivity": 0.7652982184353214,
124
+ "eval_weighted_specificity": 0.9711161070662828,
125
  "step": 803
126
  },
127
  {
128
  "epoch": 6.0,
129
+ "eval_accuracy": 0.7807900852052673,
130
+ "eval_f1_macro": 0.5371165387852578,
131
+ "eval_f1_micro": 0.7807900852052673,
132
+ "eval_f1_weighted": 0.7659242764458758,
133
+ "eval_loss": 0.684776246547699,
134
+ "eval_macro_fpr": 0.020129954279912522,
135
+ "eval_macro_sensitivity": 0.5604626117585171,
136
+ "eval_macro_specificity": 0.9836211797331506,
137
+ "eval_precision": 0.7919069236021963,
138
+ "eval_precision_macro": 0.5968972302554038,
139
+ "eval_recall": 0.7807900852052673,
140
+ "eval_recall_macro": 0.5604626117585171,
141
+ "eval_runtime": 29.4753,
142
+ "eval_samples_per_second": 43.799,
143
+ "eval_steps_per_second": 5.496,
144
+ "eval_weighted_fpr": 0.019659604029176797,
145
+ "eval_weighted_sensitivity": 0.7807900852052673,
146
+ "eval_weighted_specificity": 0.9735276107919913,
147
  "step": 964
148
  },
149
  {
150
  "epoch": 6.22,
151
+ "learning_rate": 2.916666666666667e-05,
152
+ "loss": 0.5985,
153
  "step": 1000
154
  },
155
  {
156
  "epoch": 7.0,
157
+ "eval_accuracy": 0.7978311386522076,
158
+ "eval_f1_macro": 0.6191969834738721,
159
+ "eval_f1_micro": 0.7978311386522076,
160
+ "eval_f1_weighted": 0.7857784690137476,
161
+ "eval_loss": 0.6644509434700012,
162
+ "eval_macro_fpr": 0.018390423375855742,
163
+ "eval_macro_sensitivity": 0.6251682037032721,
164
+ "eval_macro_specificity": 0.9848362780039965,
165
+ "eval_precision": 0.7880411922037887,
166
+ "eval_precision_macro": 0.6671036841379524,
167
+ "eval_recall": 0.7978311386522076,
168
+ "eval_recall_macro": 0.6251682037032721,
169
+ "eval_runtime": 29.8127,
170
+ "eval_samples_per_second": 43.304,
171
+ "eval_steps_per_second": 5.434,
172
+ "eval_weighted_fpr": 0.017778080512226686,
173
+ "eval_weighted_sensitivity": 0.7978311386522076,
174
+ "eval_weighted_specificity": 0.9747130314077416,
175
  "step": 1125
176
  }
177
  ],
178
  "logging_steps": 500,
179
+ "max_steps": 2400,
180
+ "num_train_epochs": 15,
181
  "save_steps": 500,
182
  "total_flos": 9761403521544192.0,
183
  "trial_name": null,
training_checkpoints/checkpoint-1125/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1be05b6bb510587fe353991f6f2836b34a5909cbc5adc58389938bd163228a1f
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36a33fe5941ace0a96599f0a2229d1ce6d7002fe79c5372925862ab481915414
3
  size 4600