ShengdingHu committed on
Commit
2b88c4e
1 Parent(s): 9ca3b9d

Training in progress, step 200

Browse files
all_results.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 72.47706422018348,
4
- "eval_average_metrics": 72.47706422018348,
5
- "eval_loss": 0.27757981419563293,
6
- "eval_runtime": 4.7969,
7
- "eval_samples_per_second": 340.847,
8
- "test_accuracy": 70.58103975535168,
9
- "test_average_metrics": 70.58103975535168,
10
- "test_loss": 0.2894817888736725,
11
- "test_runtime": 4.7627,
12
- "test_samples_per_second": 343.293,
13
- "train_loss": 0.2005054286374884,
14
- "train_runtime": 1293.5612,
15
  "train_samples": 9427,
16
- "train_samples_per_second": 145.753,
17
- "train_steps_per_second": 4.561
18
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 80.30581039755351,
4
+ "eval_average_metrics": 80.30581039755351,
5
+ "eval_loss": 0.19154316186904907,
6
+ "eval_runtime": 17.148,
7
+ "eval_samples_per_second": 95.346,
8
+ "test_accuracy": 79.7553516819572,
9
+ "test_average_metrics": 79.7553516819572,
10
+ "test_loss": 0.195680171251297,
11
+ "test_runtime": 16.947,
12
+ "test_samples_per_second": 96.477,
13
+ "train_loss": 0.20100380073159427,
14
+ "train_runtime": 3071.6757,
15
  "train_samples": 9427,
16
+ "train_samples_per_second": 61.38,
17
+ "train_steps_per_second": 1.921
18
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 72.47706422018348,
4
- "eval_average_metrics": 72.47706422018348,
5
- "eval_loss": 0.27757981419563293,
6
- "eval_runtime": 4.7969,
7
- "eval_samples_per_second": 340.847
8
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 80.30581039755351,
4
+ "eval_average_metrics": 80.30581039755351,
5
+ "eval_loss": 0.19154316186904907,
6
+ "eval_runtime": 17.148,
7
+ "eval_samples_per_second": 95.346
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d907e117080258b82f53f820a08988498f89966c5617a158cfd5096e79b285e7
3
- size 1084131
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93702f2d5657da40d960e58c0d8a207b7b6665c7511c220276bc5870e1229f3c
3
+ size 7551621
runs/Feb01_02-19-43_node2/1643653271.165788/events.out.tfevents.1643653271.node2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b588b667de3756bb574b0790936ea051f3054dd34b04455df005e66d0e9bfb
3
+ size 5044
runs/Feb01_02-19-43_node2/events.out.tfevents.1643653271.node2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa08ff2b0b29d280b9ce591126682b27ad4ad26343fa7714d6f90dd98bd22a3
3
+ size 4333
runs/Jan31_20-58-56_node1/events.out.tfevents.1643634109.node1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d0625210d64e8317920bc3bf2bbdd4c716e747700612e69b2917e299c1d7049
3
- size 15076
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:668c52d279f48f36addf8c932a25b2cad84c9178c36e0cff80f5e558e31a8849
3
+ size 15752
runs/Jan31_20-58-56_node1/events.out.tfevents.1643637198.node1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b626167b86719a374ddb37c8ab47614b8b66cf90adbd4e8a141fc0db128dad03
3
+ size 684
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
- "test_accuracy": 70.58103975535168,
4
- "test_average_metrics": 70.58103975535168,
5
- "test_loss": 0.2894817888736725,
6
- "test_runtime": 4.7627,
7
- "test_samples_per_second": 343.293
8
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "test_accuracy": 79.7553516819572,
4
+ "test_average_metrics": 79.7553516819572,
5
+ "test_loss": 0.195680171251297,
6
+ "test_runtime": 16.947,
7
+ "test_samples_per_second": 96.477
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
- "train_loss": 0.2005054286374884,
4
- "train_runtime": 1293.5612,
5
  "train_samples": 9427,
6
- "train_samples_per_second": 145.753,
7
- "train_steps_per_second": 4.561
8
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "train_loss": 0.20100380073159427,
4
+ "train_runtime": 3071.6757,
5
  "train_samples": 9427,
6
+ "train_samples_per_second": 61.38,
7
+ "train_steps_per_second": 1.921
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 72.47706422018348,
3
- "best_model_checkpoint": "outputs/adapter/superglue-boolq/checkpoint-3835",
4
  "epoch": 20.0,
5
  "global_step": 5900,
6
  "is_hyper_param_search": false,
@@ -8,264 +8,345 @@
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 1.0,
12
- "eval_accuracy": 62.62996941896024,
13
- "eval_average_metrics": 62.62996941896024,
14
- "eval_loss": 0.2848173677921295,
15
- "eval_runtime": 4.5081,
16
- "eval_samples_per_second": 362.682,
17
- "step": 295
 
 
 
 
 
 
 
 
 
18
  },
19
  {
20
  "epoch": 1.69,
21
  "learning_rate": 0.00027457627118644066,
22
- "loss": 0.3238,
23
  "step": 500
24
  },
25
  {
26
- "epoch": 2.0,
27
- "eval_accuracy": 62.62996941896024,
28
- "eval_average_metrics": 62.62996941896024,
29
- "eval_loss": 0.27746617794036865,
30
- "eval_runtime": 4.4839,
31
- "eval_samples_per_second": 364.64,
32
- "step": 590
33
  },
34
  {
35
- "epoch": 3.0,
36
- "eval_accuracy": 62.62996941896024,
37
- "eval_average_metrics": 62.62996941896024,
38
- "eval_loss": 0.2767568826675415,
39
- "eval_runtime": 4.4969,
40
- "eval_samples_per_second": 363.585,
41
- "step": 885
42
  },
43
  {
44
  "epoch": 3.39,
45
  "learning_rate": 0.00024915254237288135,
46
- "loss": 0.2896,
 
 
 
 
 
 
 
 
 
47
  "step": 1000
48
  },
49
  {
50
- "epoch": 4.0,
51
- "eval_accuracy": 62.75229357798165,
52
- "eval_average_metrics": 62.75229357798165,
53
- "eval_loss": 0.2767893373966217,
54
- "eval_runtime": 4.7449,
55
- "eval_samples_per_second": 344.579,
56
- "step": 1180
57
  },
58
  {
59
- "epoch": 5.0,
60
- "eval_accuracy": 63.36391437308868,
61
- "eval_average_metrics": 63.36391437308868,
62
- "eval_loss": 0.26716169714927673,
63
- "eval_runtime": 4.7487,
64
- "eval_samples_per_second": 344.302,
65
- "step": 1475
66
  },
67
  {
68
  "epoch": 5.08,
69
  "learning_rate": 0.000223728813559322,
70
- "loss": 0.2823,
71
  "step": 1500
72
  },
73
  {
74
- "epoch": 6.0,
75
- "eval_accuracy": 66.11620795107034,
76
- "eval_average_metrics": 66.11620795107034,
77
- "eval_loss": 0.2606015205383301,
78
- "eval_runtime": 4.7538,
79
- "eval_samples_per_second": 343.936,
80
- "step": 1770
 
 
 
 
 
 
 
 
 
81
  },
82
  {
83
  "epoch": 6.78,
84
  "learning_rate": 0.0001983050847457627,
85
- "loss": 0.2715,
86
  "step": 2000
87
  },
88
  {
89
- "epoch": 7.0,
90
- "eval_accuracy": 69.0519877675841,
91
- "eval_average_metrics": 69.0519877675841,
92
- "eval_loss": 0.25209498405456543,
93
- "eval_runtime": 4.7471,
94
- "eval_samples_per_second": 344.422,
95
- "step": 2065
 
 
 
 
 
 
 
 
 
96
  },
97
  {
98
- "epoch": 8.0,
99
- "eval_accuracy": 69.2354740061162,
100
- "eval_average_metrics": 69.2354740061162,
101
- "eval_loss": 0.25652435421943665,
102
- "eval_runtime": 4.7461,
103
- "eval_samples_per_second": 344.493,
104
- "step": 2360
105
  },
106
  {
107
  "epoch": 8.47,
108
  "learning_rate": 0.0001728813559322034,
109
- "loss": 0.236,
110
  "step": 2500
111
  },
112
  {
113
- "epoch": 9.0,
114
- "eval_accuracy": 71.0091743119266,
115
- "eval_average_metrics": 71.0091743119266,
116
- "eval_loss": 0.24900275468826294,
117
- "eval_runtime": 4.7529,
118
- "eval_samples_per_second": 344.002,
119
- "step": 2655
120
  },
121
  {
122
- "epoch": 10.0,
123
- "eval_accuracy": 71.80428134556574,
124
- "eval_average_metrics": 71.80428134556574,
125
- "eval_loss": 0.2635628283023834,
126
- "eval_runtime": 4.7533,
127
- "eval_samples_per_second": 343.974,
128
- "step": 2950
129
  },
130
  {
131
  "epoch": 10.17,
132
  "learning_rate": 0.00014745762711864405,
133
- "loss": 0.2038,
134
  "step": 3000
135
  },
136
  {
137
- "epoch": 11.0,
138
- "eval_accuracy": 70.70336391437309,
139
- "eval_average_metrics": 70.70336391437309,
140
- "eval_loss": 0.26442670822143555,
141
- "eval_runtime": 4.7661,
142
- "eval_samples_per_second": 343.05,
143
- "step": 3245
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
144
  },
145
  {
146
  "epoch": 11.86,
147
  "learning_rate": 0.00012203389830508474,
148
- "loss": 0.1743,
149
  "step": 3500
150
  },
151
  {
152
- "epoch": 12.0,
153
- "eval_accuracy": 71.49847094801223,
154
- "eval_average_metrics": 71.49847094801223,
155
- "eval_loss": 0.2672346830368042,
156
- "eval_runtime": 4.761,
157
- "eval_samples_per_second": 343.414,
158
- "step": 3540
159
  },
160
  {
161
- "epoch": 13.0,
162
- "eval_accuracy": 72.47706422018348,
163
- "eval_average_metrics": 72.47706422018348,
164
- "eval_loss": 0.27757981419563293,
165
- "eval_runtime": 4.7532,
166
- "eval_samples_per_second": 343.982,
167
- "step": 3835
168
  },
169
  {
170
  "epoch": 13.56,
171
  "learning_rate": 9.661016949152541e-05,
172
- "loss": 0.1493,
 
 
 
 
 
 
 
 
 
173
  "step": 4000
174
  },
175
  {
176
- "epoch": 14.0,
177
- "eval_accuracy": 70.8868501529052,
178
- "eval_average_metrics": 70.8868501529052,
179
- "eval_loss": 0.29447805881500244,
180
- "eval_runtime": 4.7492,
181
- "eval_samples_per_second": 344.268,
182
- "step": 4130
183
  },
184
  {
185
- "epoch": 15.0,
186
- "eval_accuracy": 70.21406727828746,
187
- "eval_average_metrics": 70.21406727828746,
188
- "eval_loss": 0.2965507209300995,
189
- "eval_runtime": 4.7633,
190
- "eval_samples_per_second": 343.251,
191
- "step": 4425
192
  },
193
  {
194
  "epoch": 15.25,
195
  "learning_rate": 7.11864406779661e-05,
196
- "loss": 0.1336,
197
  "step": 4500
198
  },
199
  {
200
- "epoch": 16.0,
201
- "eval_accuracy": 72.29357798165138,
202
- "eval_average_metrics": 72.29357798165138,
203
- "eval_loss": 0.3127536177635193,
204
- "eval_runtime": 4.7675,
205
- "eval_samples_per_second": 342.95,
206
- "step": 4720
 
 
 
 
 
 
 
 
 
207
  },
208
  {
209
  "epoch": 16.95,
210
  "learning_rate": 4.576271186440678e-05,
211
- "loss": 0.1166,
212
  "step": 5000
213
  },
214
  {
215
- "epoch": 17.0,
216
- "eval_accuracy": 70.9480122324159,
217
- "eval_average_metrics": 70.9480122324159,
218
- "eval_loss": 0.3478758931159973,
219
- "eval_runtime": 4.7792,
220
- "eval_samples_per_second": 342.105,
221
- "step": 5015
222
  },
223
  {
224
- "epoch": 18.0,
225
- "eval_accuracy": 72.17125382262996,
226
- "eval_average_metrics": 72.17125382262996,
227
- "eval_loss": 0.33715757727622986,
228
- "eval_runtime": 4.7549,
229
- "eval_samples_per_second": 343.858,
230
- "step": 5310
 
 
 
 
 
 
 
 
 
231
  },
232
  {
233
  "epoch": 18.64,
234
  "learning_rate": 2.0338983050847455e-05,
235
- "loss": 0.1059,
236
  "step": 5500
237
  },
238
  {
239
- "epoch": 19.0,
240
- "eval_accuracy": 71.92660550458716,
241
- "eval_average_metrics": 71.92660550458716,
242
- "eval_loss": 0.34181272983551025,
243
- "eval_runtime": 4.753,
244
- "eval_samples_per_second": 343.993,
245
- "step": 5605
246
  },
247
  {
248
- "epoch": 20.0,
249
- "eval_accuracy": 71.80428134556574,
250
- "eval_average_metrics": 71.80428134556574,
251
- "eval_loss": 0.34913983941078186,
252
- "eval_runtime": 4.7538,
253
- "eval_samples_per_second": 343.937,
254
- "step": 5900
255
  },
256
  {
257
  "epoch": 20.0,
258
  "step": 5900,
259
- "total_flos": 5.78564930408256e+16,
260
- "train_loss": 0.2005054286374884,
261
- "train_runtime": 1293.5612,
262
- "train_samples_per_second": 145.753,
263
- "train_steps_per_second": 4.561
264
  }
265
  ],
266
  "max_steps": 5900,
267
  "num_train_epochs": 20,
268
- "total_flos": 5.78564930408256e+16,
269
  "trial_name": null,
270
  "trial_params": null
271
  }
 
1
  {
2
+ "best_metric": 80.30581039755351,
3
+ "best_model_checkpoint": "outputs/bitfit/t5-base/superglue-boolq/checkpoint-2600",
4
  "epoch": 20.0,
5
  "global_step": 5900,
6
  "is_hyper_param_search": false,
 
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.68,
12
+ "eval_accuracy": 74.6788990825688,
13
+ "eval_average_metrics": 74.6788990825688,
14
+ "eval_loss": 0.21743574738502502,
15
+ "eval_runtime": 16.9831,
16
+ "eval_samples_per_second": 96.272,
17
+ "step": 200
18
+ },
19
+ {
20
+ "epoch": 1.36,
21
+ "eval_accuracy": 75.71865443425077,
22
+ "eval_average_metrics": 75.71865443425077,
23
+ "eval_loss": 0.21506452560424805,
24
+ "eval_runtime": 14.6109,
25
+ "eval_samples_per_second": 111.903,
26
+ "step": 400
27
  },
28
  {
29
  "epoch": 1.69,
30
  "learning_rate": 0.00027457627118644066,
31
+ "loss": 0.374,
32
  "step": 500
33
  },
34
  {
35
+ "epoch": 2.03,
36
+ "eval_accuracy": 77.18654434250764,
37
+ "eval_average_metrics": 77.18654434250764,
38
+ "eval_loss": 0.20255930721759796,
39
+ "eval_runtime": 17.1645,
40
+ "eval_samples_per_second": 95.254,
41
+ "step": 600
42
  },
43
  {
44
+ "epoch": 2.71,
45
+ "eval_accuracy": 76.5137614678899,
46
+ "eval_average_metrics": 76.5137614678899,
47
+ "eval_loss": 0.220754012465477,
48
+ "eval_runtime": 17.1929,
49
+ "eval_samples_per_second": 95.097,
50
+ "step": 800
51
  },
52
  {
53
  "epoch": 3.39,
54
  "learning_rate": 0.00024915254237288135,
55
+ "loss": 0.2114,
56
+ "step": 1000
57
+ },
58
+ {
59
+ "epoch": 3.39,
60
+ "eval_accuracy": 78.1651376146789,
61
+ "eval_average_metrics": 78.1651376146789,
62
+ "eval_loss": 0.19822736084461212,
63
+ "eval_runtime": 14.5865,
64
+ "eval_samples_per_second": 112.09,
65
  "step": 1000
66
  },
67
  {
68
+ "epoch": 4.07,
69
+ "eval_accuracy": 78.71559633027523,
70
+ "eval_average_metrics": 78.71559633027523,
71
+ "eval_loss": 0.19769148528575897,
72
+ "eval_runtime": 17.1866,
73
+ "eval_samples_per_second": 95.132,
74
+ "step": 1200
75
  },
76
  {
77
+ "epoch": 4.75,
78
+ "eval_accuracy": 78.2262996941896,
79
+ "eval_average_metrics": 78.2262996941896,
80
+ "eval_loss": 0.1974276602268219,
81
+ "eval_runtime": 17.1722,
82
+ "eval_samples_per_second": 95.212,
83
+ "step": 1400
84
  },
85
  {
86
  "epoch": 5.08,
87
  "learning_rate": 0.000223728813559322,
88
+ "loss": 0.1997,
89
  "step": 1500
90
  },
91
  {
92
+ "epoch": 5.42,
93
+ "eval_accuracy": 78.71559633027523,
94
+ "eval_average_metrics": 78.71559633027523,
95
+ "eval_loss": 0.19954562187194824,
96
+ "eval_runtime": 14.5679,
97
+ "eval_samples_per_second": 112.233,
98
+ "step": 1600
99
+ },
100
+ {
101
+ "epoch": 6.1,
102
+ "eval_accuracy": 78.2262996941896,
103
+ "eval_average_metrics": 78.2262996941896,
104
+ "eval_loss": 0.20299072563648224,
105
+ "eval_runtime": 17.2624,
106
+ "eval_samples_per_second": 94.714,
107
+ "step": 1800
108
  },
109
  {
110
  "epoch": 6.78,
111
  "learning_rate": 0.0001983050847457627,
112
+ "loss": 0.1934,
113
  "step": 2000
114
  },
115
  {
116
+ "epoch": 6.78,
117
+ "eval_accuracy": 79.63302752293579,
118
+ "eval_average_metrics": 79.63302752293579,
119
+ "eval_loss": 0.19578830897808075,
120
+ "eval_runtime": 17.2808,
121
+ "eval_samples_per_second": 94.614,
122
+ "step": 2000
123
+ },
124
+ {
125
+ "epoch": 7.46,
126
+ "eval_accuracy": 79.26605504587157,
127
+ "eval_average_metrics": 79.26605504587157,
128
+ "eval_loss": 0.1937599629163742,
129
+ "eval_runtime": 15.3794,
130
+ "eval_samples_per_second": 106.311,
131
+ "step": 2200
132
  },
133
  {
134
+ "epoch": 8.14,
135
+ "eval_accuracy": 77.92048929663609,
136
+ "eval_average_metrics": 77.92048929663609,
137
+ "eval_loss": 0.2019716054201126,
138
+ "eval_runtime": 17.5057,
139
+ "eval_samples_per_second": 93.398,
140
+ "step": 2400
141
  },
142
  {
143
  "epoch": 8.47,
144
  "learning_rate": 0.0001728813559322034,
145
+ "loss": 0.1907,
146
  "step": 2500
147
  },
148
  {
149
+ "epoch": 8.81,
150
+ "eval_accuracy": 80.30581039755351,
151
+ "eval_average_metrics": 80.30581039755351,
152
+ "eval_loss": 0.19154316186904907,
153
+ "eval_runtime": 17.3782,
154
+ "eval_samples_per_second": 94.083,
155
+ "step": 2600
156
  },
157
  {
158
+ "epoch": 9.49,
159
+ "eval_accuracy": 79.93883792048929,
160
+ "eval_average_metrics": 79.93883792048929,
161
+ "eval_loss": 0.19677455723285675,
162
+ "eval_runtime": 15.9661,
163
+ "eval_samples_per_second": 102.404,
164
+ "step": 2800
165
  },
166
  {
167
  "epoch": 10.17,
168
  "learning_rate": 0.00014745762711864405,
169
+ "loss": 0.183,
170
  "step": 3000
171
  },
172
  {
173
+ "epoch": 10.17,
174
+ "eval_accuracy": 79.44954128440367,
175
+ "eval_average_metrics": 79.44954128440367,
176
+ "eval_loss": 0.19117017090320587,
177
+ "eval_runtime": 17.2749,
178
+ "eval_samples_per_second": 94.646,
179
+ "step": 3000
180
+ },
181
+ {
182
+ "epoch": 10.85,
183
+ "eval_accuracy": 78.10397553516819,
184
+ "eval_average_metrics": 78.10397553516819,
185
+ "eval_loss": 0.20411182940006256,
186
+ "eval_runtime": 17.1181,
187
+ "eval_samples_per_second": 95.513,
188
+ "step": 3200
189
+ },
190
+ {
191
+ "epoch": 11.53,
192
+ "eval_accuracy": 79.02140672782875,
193
+ "eval_average_metrics": 79.02140672782875,
194
+ "eval_loss": 0.194900244474411,
195
+ "eval_runtime": 17.1955,
196
+ "eval_samples_per_second": 95.083,
197
+ "step": 3400
198
  },
199
  {
200
  "epoch": 11.86,
201
  "learning_rate": 0.00012203389830508474,
202
+ "loss": 0.181,
203
  "step": 3500
204
  },
205
  {
206
+ "epoch": 12.2,
207
+ "eval_accuracy": 79.38837920489297,
208
+ "eval_average_metrics": 79.38837920489297,
209
+ "eval_loss": 0.20091596245765686,
210
+ "eval_runtime": 16.9905,
211
+ "eval_samples_per_second": 96.23,
212
+ "step": 3600
213
  },
214
  {
215
+ "epoch": 12.88,
216
+ "eval_accuracy": 79.81651376146789,
217
+ "eval_average_metrics": 79.81651376146789,
218
+ "eval_loss": 0.18894420564174652,
219
+ "eval_runtime": 17.2706,
220
+ "eval_samples_per_second": 94.669,
221
+ "step": 3800
222
  },
223
  {
224
  "epoch": 13.56,
225
  "learning_rate": 9.661016949152541e-05,
226
+ "loss": 0.1786,
227
+ "step": 4000
228
+ },
229
+ {
230
+ "epoch": 13.56,
231
+ "eval_accuracy": 78.77675840978593,
232
+ "eval_average_metrics": 78.77675840978593,
233
+ "eval_loss": 0.20160046219825745,
234
+ "eval_runtime": 17.0941,
235
+ "eval_samples_per_second": 95.647,
236
  "step": 4000
237
  },
238
  {
239
+ "epoch": 14.24,
240
+ "eval_accuracy": 79.57186544342507,
241
+ "eval_average_metrics": 79.57186544342507,
242
+ "eval_loss": 0.19864365458488464,
243
+ "eval_runtime": 17.0536,
244
+ "eval_samples_per_second": 95.874,
245
+ "step": 4200
246
  },
247
  {
248
+ "epoch": 14.92,
249
+ "eval_accuracy": 79.51070336391437,
250
+ "eval_average_metrics": 79.51070336391437,
251
+ "eval_loss": 0.19150203466415405,
252
+ "eval_runtime": 17.2063,
253
+ "eval_samples_per_second": 95.024,
254
+ "step": 4400
255
  },
256
  {
257
  "epoch": 15.25,
258
  "learning_rate": 7.11864406779661e-05,
259
+ "loss": 0.1769,
260
  "step": 4500
261
  },
262
  {
263
+ "epoch": 15.59,
264
+ "eval_accuracy": 78.77675840978593,
265
+ "eval_average_metrics": 78.77675840978593,
266
+ "eval_loss": 0.19904659688472748,
267
+ "eval_runtime": 17.1806,
268
+ "eval_samples_per_second": 95.165,
269
+ "step": 4600
270
+ },
271
+ {
272
+ "epoch": 16.27,
273
+ "eval_accuracy": 79.20489296636084,
274
+ "eval_average_metrics": 79.20489296636084,
275
+ "eval_loss": 0.19741013646125793,
276
+ "eval_runtime": 17.2538,
277
+ "eval_samples_per_second": 94.762,
278
+ "step": 4800
279
  },
280
  {
281
  "epoch": 16.95,
282
  "learning_rate": 4.576271186440678e-05,
283
+ "loss": 0.1741,
284
  "step": 5000
285
  },
286
  {
287
+ "epoch": 16.95,
288
+ "eval_accuracy": 79.51070336391437,
289
+ "eval_average_metrics": 79.51070336391437,
290
+ "eval_loss": 0.19429509341716766,
291
+ "eval_runtime": 17.4899,
292
+ "eval_samples_per_second": 93.483,
293
+ "step": 5000
294
  },
295
  {
296
+ "epoch": 17.63,
297
+ "eval_accuracy": 78.89908256880734,
298
+ "eval_average_metrics": 78.89908256880734,
299
+ "eval_loss": 0.20053960382938385,
300
+ "eval_runtime": 17.2615,
301
+ "eval_samples_per_second": 94.719,
302
+ "step": 5200
303
+ },
304
+ {
305
+ "epoch": 18.31,
306
+ "eval_accuracy": 79.32721712538226,
307
+ "eval_average_metrics": 79.32721712538226,
308
+ "eval_loss": 0.1975349634885788,
309
+ "eval_runtime": 17.2849,
310
+ "eval_samples_per_second": 94.591,
311
+ "step": 5400
312
  },
313
  {
314
  "epoch": 18.64,
315
  "learning_rate": 2.0338983050847455e-05,
316
+ "loss": 0.1717,
317
  "step": 5500
318
  },
319
  {
320
+ "epoch": 18.98,
321
+ "eval_accuracy": 78.77675840978593,
322
+ "eval_average_metrics": 78.77675840978593,
323
+ "eval_loss": 0.20098499953746796,
324
+ "eval_runtime": 17.3626,
325
+ "eval_samples_per_second": 94.168,
326
+ "step": 5600
327
  },
328
  {
329
+ "epoch": 19.66,
330
+ "eval_accuracy": 79.20489296636084,
331
+ "eval_average_metrics": 79.20489296636084,
332
+ "eval_loss": 0.19755637645721436,
333
+ "eval_runtime": 17.3825,
334
+ "eval_samples_per_second": 94.06,
335
+ "step": 5800
336
  },
337
  {
338
  "epoch": 20.0,
339
  "step": 5900,
340
+ "total_flos": 5.74047486286578e+16,
341
+ "train_loss": 0.20100380073159427,
342
+ "train_runtime": 3071.6757,
343
+ "train_samples_per_second": 61.38,
344
+ "train_steps_per_second": 1.921
345
  }
346
  ],
347
  "max_steps": 5900,
348
  "num_train_epochs": 20,
349
+ "total_flos": 5.74047486286578e+16,
350
  "trial_name": null,
351
  "trial_params": null
352
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:269bb6113ca5087e1a8b4f6f408b50f081fcdff789ba3839dd26d80788deca12
3
  size 3183
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f661110841353ed072f3e206dcbfb7b75b9c2fdbb0068e52fff4617c10698d9e
3
  size 3183
training_config.json CHANGED
@@ -1 +1 @@
1
- {"dataset_config_name": ["en"], "delta_type": "bitfit", "do_eval": true, "do_test": true, "do_train": true, "eval_dataset_config_name": ["en"], "eval_dataset_name": "superglue-boolq", "eval_steps": 200, "evaluation_strategy": "steps", "greater_is_better": true, "learning_rate": 0.0003, "load_best_model_at_end": true, "max_source_length": 256, "metric_for_best_model": "average_metrics", "model_name_or_path": "../../../../plm_cache/t5-base", "num_train_epochs": 20, "output_dir": "outputs/bitfit/t5-base/superglue-boolq", "overwrite_output_dir": true, "per_device_eval_batch_size": 32, "per_device_train_batch_size": 32, "predict_with_generate": true, "push_to_hub": true, "save_steps": 200, "save_strategy": "steps", "save_total_limit": 1, "seed": 42, "split_validation_test": true, "task_name": "superglue-boolq", "test_dataset_config_name": ["en"], "test_dataset_name": "superglue-boolq", "tokenizer_name": "../../../../plm_cache/t5-base", "warmup_steps": 0}
 
1
+ {"bottleneck_dim": 24, "dataset_config_name": ["en"], "delta_type": "adapter", "do_eval": true, "do_test": true, "do_train": true, "eval_dataset_config_name": ["en"], "eval_dataset_name": "superglue-boolq", "eval_steps": 200, "evaluation_strategy": "steps", "greater_is_better": true, "learning_rate": 0.0003, "load_best_model_at_end": true, "max_source_length": 256, "metric_for_best_model": "average_metrics", "model_name_or_path": "../../../../plm_cache/t5-base", "num_train_epochs": 20, "output_dir": "outputs/bitfit/t5-base/superglue-boolq", "overwrite_output_dir": true, "per_device_eval_batch_size": 32, "per_device_train_batch_size": 32, "predict_with_generate": true, "push_to_hub": true, "save_steps": 200, "save_strategy": "steps", "save_total_limit": 1, "seed": 42, "split_validation_test": true, "task_name": "superglue-boolq", "test_dataset_config_name": ["en"], "test_dataset_name": "superglue-boolq", "tokenizer_name": "../../../../plm_cache/t5-base", "unfrozen_modules": ["deltas", "layer_norm", "final_layer_norm"], "warmup_steps": 0}