File size: 8,390 Bytes
c528230
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
{
  "best_metric": 0.6654040404040403,
  "best_model_checkpoint": "twitter-roberta-base-WNUT/checkpoint-500",
  "epoch": 10.0,
  "global_step": 540,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.46,
      "eval_accuracy": 0.9205491641772071,
      "eval_f1": 0.0,
      "eval_loss": 0.39121243357658386,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 1.5425,
      "eval_samples_per_second": 654.138,
      "eval_steps_per_second": 0.648,
      "step": 25
    },
    {
      "epoch": 0.93,
      "eval_accuracy": 0.9209305281891565,
      "eval_f1": 0.004739336492890995,
      "eval_loss": 0.2846619784832001,
      "eval_precision": 0.25,
      "eval_recall": 0.0023923444976076554,
      "eval_runtime": 1.5304,
      "eval_samples_per_second": 659.288,
      "eval_steps_per_second": 0.653,
      "step": 50
    },
    {
      "epoch": 1.39,
      "eval_accuracy": 0.9426047162016145,
      "eval_f1": 0.4239766081871345,
      "eval_loss": 0.2449360191822052,
      "eval_precision": 0.5451127819548872,
      "eval_recall": 0.34688995215311,
      "eval_runtime": 1.487,
      "eval_samples_per_second": 678.556,
      "eval_steps_per_second": 0.673,
      "step": 75
    },
    {
      "epoch": 1.85,
      "eval_accuracy": 0.9491514650734125,
      "eval_f1": 0.5565455791638108,
      "eval_loss": 0.19464540481567383,
      "eval_precision": 0.651685393258427,
      "eval_recall": 0.48564593301435405,
      "eval_runtime": 1.5409,
      "eval_samples_per_second": 654.812,
      "eval_steps_per_second": 0.649,
      "step": 100
    },
    {
      "epoch": 2.31,
      "eval_accuracy": 0.9581135193542236,
      "eval_f1": 0.621870882740448,
      "eval_loss": 0.1851097047328949,
      "eval_precision": 0.6920821114369502,
      "eval_recall": 0.5645933014354066,
      "eval_runtime": 1.5283,
      "eval_samples_per_second": 660.202,
      "eval_steps_per_second": 0.654,
      "step": 125
    },
    {
      "epoch": 2.78,
      "eval_accuracy": 0.9594482933960465,
      "eval_f1": 0.6331399097356544,
      "eval_loss": 0.1671772003173828,
      "eval_precision": 0.6867132867132867,
      "eval_recall": 0.5873205741626795,
      "eval_runtime": 1.7364,
      "eval_samples_per_second": 581.088,
      "eval_steps_per_second": 0.576,
      "step": 150
    },
    {
      "epoch": 3.24,
      "eval_accuracy": 0.9615457954617682,
      "eval_f1": 0.6276527331189711,
      "eval_loss": 0.16754180192947388,
      "eval_precision": 0.6787204450625869,
      "eval_recall": 0.583732057416268,
      "eval_runtime": 1.522,
      "eval_samples_per_second": 662.938,
      "eval_steps_per_second": 0.657,
      "step": 175
    },
    {
      "epoch": 3.7,
      "eval_accuracy": 0.9637704188648064,
      "eval_f1": 0.65389369592089,
      "eval_loss": 0.16441918909549713,
      "eval_precision": 0.6764705882352942,
      "eval_recall": 0.6327751196172249,
      "eval_runtime": 1.5477,
      "eval_samples_per_second": 651.939,
      "eval_steps_per_second": 0.646,
      "step": 200
    },
    {
      "epoch": 4.17,
      "eval_accuracy": 0.9640246615394394,
      "eval_f1": 0.673697270471464,
      "eval_loss": 0.1672356277704239,
      "eval_precision": 0.6997422680412371,
      "eval_recall": 0.6495215311004785,
      "eval_runtime": 1.5668,
      "eval_samples_per_second": 643.973,
      "eval_steps_per_second": 0.638,
      "step": 225
    },
    {
      "epoch": 4.63,
      "eval_accuracy": 0.9648509502319964,
      "eval_f1": 0.6666666666666666,
      "eval_loss": 0.16518081724643707,
      "eval_precision": 0.6915167095115681,
      "eval_recall": 0.6435406698564593,
      "eval_runtime": 1.544,
      "eval_samples_per_second": 653.501,
      "eval_steps_per_second": 0.648,
      "step": 250
    },
    {
      "epoch": 5.09,
      "eval_accuracy": 0.9629441301722494,
      "eval_f1": 0.6520618556701031,
      "eval_loss": 0.18820269405841827,
      "eval_precision": 0.7067039106145251,
      "eval_recall": 0.6052631578947368,
      "eval_runtime": 1.5459,
      "eval_samples_per_second": 652.688,
      "eval_steps_per_second": 0.647,
      "step": 275
    },
    {
      "epoch": 5.56,
      "eval_accuracy": 0.9644695862200471,
      "eval_f1": 0.6717267552182163,
      "eval_loss": 0.17831429839134216,
      "eval_precision": 0.7127516778523489,
      "eval_recall": 0.6351674641148325,
      "eval_runtime": 1.5976,
      "eval_samples_per_second": 631.564,
      "eval_steps_per_second": 0.626,
      "step": 300
    },
    {
      "epoch": 6.02,
      "eval_accuracy": 0.9638975402021229,
      "eval_f1": 0.6564885496183207,
      "eval_loss": 0.18128034472465515,
      "eval_precision": 0.7010869565217391,
      "eval_recall": 0.6172248803827751,
      "eval_runtime": 1.5524,
      "eval_samples_per_second": 649.966,
      "eval_steps_per_second": 0.644,
      "step": 325
    },
    {
      "epoch": 6.48,
      "eval_accuracy": 0.96472382889468,
      "eval_f1": 0.677561282212445,
      "eval_loss": 0.18036700785160065,
      "eval_precision": 0.713907284768212,
      "eval_recall": 0.6447368421052632,
      "eval_runtime": 1.6249,
      "eval_samples_per_second": 620.943,
      "eval_steps_per_second": 0.615,
      "step": 350
    },
    {
      "epoch": 6.94,
      "eval_accuracy": 0.9640882222080976,
      "eval_f1": 0.6709346991037132,
      "eval_loss": 0.19022008776664734,
      "eval_precision": 0.721763085399449,
      "eval_recall": 0.6267942583732058,
      "eval_runtime": 1.8093,
      "eval_samples_per_second": 557.663,
      "eval_steps_per_second": 0.553,
      "step": 375
    },
    {
      "epoch": 7.41,
      "eval_accuracy": 0.9640882222080976,
      "eval_f1": 0.668777707409753,
      "eval_loss": 0.1882619857788086,
      "eval_precision": 0.7106325706594886,
      "eval_recall": 0.631578947368421,
      "eval_runtime": 1.62,
      "eval_samples_per_second": 622.858,
      "eval_steps_per_second": 0.617,
      "step": 400
    },
    {
      "epoch": 7.87,
      "eval_accuracy": 0.9642789042140724,
      "eval_f1": 0.6683480453972257,
      "eval_loss": 0.18618735671043396,
      "eval_precision": 0.7066666666666667,
      "eval_recall": 0.6339712918660287,
      "eval_runtime": 1.5944,
      "eval_samples_per_second": 632.853,
      "eval_steps_per_second": 0.627,
      "step": 425
    },
    {
      "epoch": 8.33,
      "eval_accuracy": 0.9638975402021229,
      "eval_f1": 0.6670870113493064,
      "eval_loss": 0.1881590634584427,
      "eval_precision": 0.7053333333333334,
      "eval_recall": 0.6327751196172249,
      "eval_runtime": 1.7003,
      "eval_samples_per_second": 593.415,
      "eval_steps_per_second": 0.588,
      "step": 450
    },
    {
      "epoch": 8.8,
      "eval_accuracy": 0.9638339795334647,
      "eval_f1": 0.6658243840808591,
      "eval_loss": 0.19190868735313416,
      "eval_precision": 0.7054886211512718,
      "eval_recall": 0.6303827751196173,
      "eval_runtime": 1.543,
      "eval_samples_per_second": 653.928,
      "eval_steps_per_second": 0.648,
      "step": 475
    },
    {
      "epoch": 9.26,
      "learning_rate": 1.4814814814814815e-06,
      "loss": 0.1175,
      "step": 500
    },
    {
      "epoch": 9.26,
      "eval_accuracy": 0.9639611008707811,
      "eval_f1": 0.6654040404040403,
      "eval_loss": 0.19381117820739746,
      "eval_precision": 0.7045454545454546,
      "eval_recall": 0.6303827751196173,
      "eval_runtime": 1.541,
      "eval_samples_per_second": 654.789,
      "eval_steps_per_second": 0.649,
      "step": 500
    },
    {
      "epoch": 9.72,
      "eval_accuracy": 0.9645967075573635,
      "eval_f1": 0.6704190118824266,
      "eval_loss": 0.18799594044685364,
      "eval_precision": 0.7024901703800787,
      "eval_recall": 0.6411483253588517,
      "eval_runtime": 1.6071,
      "eval_samples_per_second": 627.849,
      "eval_steps_per_second": 0.622,
      "step": 525
    },
    {
      "epoch": 10.0,
      "step": 540,
      "total_flos": 1009327449452316.0,
      "train_loss": 0.11085769158822519,
      "train_runtime": 157.5154,
      "train_samples_per_second": 215.471,
      "train_steps_per_second": 3.428
    }
  ],
  "max_steps": 540,
  "num_train_epochs": 10,
  "total_flos": 1009327449452316.0,
  "trial_name": null,
  "trial_params": null
}