File size: 7,358 Bytes
f6de6f2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 10940,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0,
      "learning_rate": 1.9998171846435103e-05,
      "loss": 3.4748,
      "step": 1
    },
    {
      "epoch": 0.23,
      "learning_rate": 1.7714808043875687e-05,
      "loss": 0.3223,
      "step": 1250
    },
    {
      "epoch": 0.46,
      "learning_rate": 1.5429616087751372e-05,
      "loss": 0.1466,
      "step": 2500
    },
    {
      "epoch": 0.69,
      "learning_rate": 1.3144424131627058e-05,
      "loss": 0.1219,
      "step": 3750
    },
    {
      "epoch": 0.91,
      "learning_rate": 1.0859232175502743e-05,
      "loss": 0.1025,
      "step": 5000
    },
    {
      "epoch": 1.0,
      "eval_ANIM": {
        "f1": 0.6988922457200403,
        "number": 3208,
        "precision": 0.5861486486486487,
        "recall": 0.8653366583541147
      },
      "eval_BIO": {
        "f1": 0.5263157894736842,
        "number": 16,
        "precision": 0.45454545454545453,
        "recall": 0.625
      },
      "eval_CEL": {
        "f1": 0.7659574468085106,
        "number": 82,
        "precision": 0.6792452830188679,
        "recall": 0.8780487804878049
      },
      "eval_DIS": {
        "f1": 0.6575342465753424,
        "number": 1518,
        "precision": 0.5229571984435798,
        "recall": 0.8853754940711462
      },
      "eval_EVE": {
        "f1": 0.958100558659218,
        "number": 704,
        "precision": 0.9423076923076923,
        "recall": 0.9744318181818182
      },
      "eval_FOOD": {
        "f1": 0.53125,
        "number": 1132,
        "precision": 0.38825448613376834,
        "recall": 0.8409893992932862
      },
      "eval_INST": {
        "f1": 0.5454545454545454,
        "number": 24,
        "precision": 0.42857142857142855,
        "recall": 0.75
      },
      "eval_LOC": {
        "f1": 0.9938849369774116,
        "number": 24048,
        "precision": 0.9942571785268415,
        "recall": 0.9935129740518962
      },
      "eval_MEDIA": {
        "f1": 0.9480381760339343,
        "number": 916,
        "precision": 0.9216494845360824,
        "recall": 0.9759825327510917
      },
      "eval_MYTH": {
        "f1": 0.6987951807228915,
        "number": 64,
        "precision": 0.5686274509803921,
        "recall": 0.90625
      },
      "eval_ORG": {
        "f1": 0.9804511278195489,
        "number": 6618,
        "precision": 0.9757557617479796,
        "recall": 0.9851919008763977
      },
      "eval_PER": {
        "f1": 0.9935385784872672,
        "number": 10530,
        "precision": 0.9941053432211447,
        "recall": 0.9929724596391263
      },
      "eval_PLANT": {
        "f1": 0.56656346749226,
        "number": 1788,
        "precision": 0.4331360946745562,
        "recall": 0.8187919463087249
      },
      "eval_TIME": {
        "f1": 0.7452830188679245,
        "number": 578,
        "precision": 0.6829971181556196,
        "recall": 0.8200692041522492
      },
      "eval_VEHI": {
        "f1": 0.8571428571428572,
        "number": 64,
        "precision": 0.7894736842105263,
        "recall": 0.9375
      },
      "eval_loss": 0.09848607331514359,
      "eval_overall_accuracy": 0.9839002953677689,
      "eval_overall_f1": 0.9165482757984463,
      "eval_overall_precision": 0.8698606149751348,
      "eval_overall_recall": 0.9685318775589784,
      "eval_runtime": 95.1985,
      "eval_samples_per_second": 345.678,
      "eval_steps_per_second": 7.206,
      "step": 5470
    },
    {
      "epoch": 1.14,
      "learning_rate": 8.574040219378429e-06,
      "loss": 0.0791,
      "step": 6250
    },
    {
      "epoch": 1.37,
      "learning_rate": 6.288848263254113e-06,
      "loss": 0.0668,
      "step": 7500
    },
    {
      "epoch": 1.6,
      "learning_rate": 4.003656307129799e-06,
      "loss": 0.0584,
      "step": 8750
    },
    {
      "epoch": 1.83,
      "learning_rate": 1.7184643510054846e-06,
      "loss": 0.0526,
      "step": 10000
    },
    {
      "epoch": 2.0,
      "eval_ANIM": {
        "f1": 0.7314670813893208,
        "number": 3208,
        "precision": 0.6259982253771074,
        "recall": 0.8796758104738155
      },
      "eval_BIO": {
        "f1": 0.6363636363636364,
        "number": 16,
        "precision": 0.5,
        "recall": 0.875
      },
      "eval_CEL": {
        "f1": 0.7835051546391752,
        "number": 82,
        "precision": 0.6785714285714286,
        "recall": 0.926829268292683
      },
      "eval_DIS": {
        "f1": 0.6950578338590956,
        "number": 1518,
        "precision": 0.5783027121609798,
        "recall": 0.8708827404479579
      },
      "eval_EVE": {
        "f1": 0.9678321678321677,
        "number": 704,
        "precision": 0.953168044077135,
        "recall": 0.9829545454545454
      },
      "eval_FOOD": {
        "f1": 0.5880893300248139,
        "number": 1132,
        "precision": 0.45315487571701724,
        "recall": 0.8374558303886925
      },
      "eval_INST": {
        "f1": 0.5625000000000001,
        "number": 24,
        "precision": 0.45,
        "recall": 0.75
      },
      "eval_LOC": {
        "f1": 0.9941398944349777,
        "number": 24048,
        "precision": 0.9936030572401762,
        "recall": 0.9946773120425815
      },
      "eval_MEDIA": {
        "f1": 0.9540106951871657,
        "number": 916,
        "precision": 0.9350104821802935,
        "recall": 0.9737991266375546
      },
      "eval_MYTH": {
        "f1": 0.8055555555555555,
        "number": 64,
        "precision": 0.725,
        "recall": 0.90625
      },
      "eval_ORG": {
        "f1": 0.9806938159879336,
        "number": 6618,
        "precision": 0.9789220114423366,
        "recall": 0.9824720459353279
      },
      "eval_PER": {
        "f1": 0.9945915172217479,
        "number": 10530,
        "precision": 0.9937428896473265,
        "recall": 0.9954415954415955
      },
      "eval_PLANT": {
        "f1": 0.6153232242617718,
        "number": 1788,
        "precision": 0.478287841191067,
        "recall": 0.8624161073825504
      },
      "eval_TIME": {
        "f1": 0.7310030395136778,
        "number": 578,
        "precision": 0.6517615176151762,
        "recall": 0.8321799307958477
      },
      "eval_VEHI": {
        "f1": 0.8571428571428572,
        "number": 64,
        "precision": 0.7894736842105263,
        "recall": 0.9375
      },
      "eval_loss": 0.11049605160951614,
      "eval_overall_accuracy": 0.9861263597723507,
      "eval_overall_f1": 0.9277588486101026,
      "eval_overall_precision": 0.8877743728620296,
      "eval_overall_recall": 0.9715149151881458,
      "eval_runtime": 94.1134,
      "eval_samples_per_second": 349.663,
      "eval_steps_per_second": 7.289,
      "step": 10940
    },
    {
      "epoch": 2.0,
      "step": 10940,
      "total_flos": 1.929975843125117e+16,
      "train_loss": 0.1132796828881914,
      "train_runtime": 2485.5568,
      "train_samples_per_second": 211.269,
      "train_steps_per_second": 4.401
    }
  ],
  "logging_steps": 1250,
  "max_steps": 10940,
  "num_train_epochs": 2,
  "save_steps": 500,
  "total_flos": 1.929975843125117e+16,
  "trial_name": null,
  "trial_params": null
}