Darius07 committed on
Commit
33bded9
1 Parent(s): 47506a6

End of training

Browse files
Files changed (5) hide show
  1. README.md +4 -4
  2. all_results.json +11 -11
  3. eval_results.json +8 -8
  4. train_results.json +3 -3
  5. trainer_state.json +137 -137
README.md CHANGED
@@ -4,7 +4,7 @@ base_model: xlm-roberta-base
4
  tags:
5
  - generated_from_trainer
6
  datasets:
7
- - universal_ner
8
  metrics:
9
  - precision
10
  - recall
@@ -17,8 +17,8 @@ model-index:
17
  name: Token Classification
18
  type: token-classification
19
  dataset:
20
- name: universal_ner
21
- type: universal_ner
22
  config: en_ewt
23
  split: validation
24
  args: en_ewt
@@ -42,7 +42,7 @@ should probably proofread and complete it, then remove this comment. -->
42
 
43
  # UNER_subword_tk_en_lora_alpha_64_drop_0.3_rank_32_seed_42
44
 
45
- This model is a fine-tuned version of [xlm-roberta-base](https://huggingface.co/xlm-roberta-base) on the universal_ner dataset.
46
  It achieves the following results on the evaluation set:
47
  - Loss: 0.0607
48
  - Precision: 0.7736
 
4
  tags:
5
  - generated_from_trainer
6
  datasets:
7
+ - universalner/universal_ner
8
  metrics:
9
  - precision
10
  - recall
 
17
  name: Token Classification
18
  type: token-classification
19
  dataset:
20
+ name: universalner/universal_ner en_ewt
21
+ type: universalner/universal_ner
22
  config: en_ewt
23
  split: validation
24
  args: en_ewt
 
42
 
43
  # UNER_subword_tk_en_lora_alpha_64_drop_0.3_rank_32_seed_42
44
 
45
+ This model is a fine-tuned version of [xlm-roberta-base](https://huggingface.co/xlm-roberta-base) on the universalner/universal_ner en_ewt dataset.
46
  It achieves the following results on the evaluation set:
47
  - Loss: 0.0607
48
  - Precision: 0.7736
all_results.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 0.9841743210465624,
4
- "eval_f1": 0.8008028098344204,
5
- "eval_loss": 0.06448859721422195,
6
- "eval_precision": 0.7770204479065238,
7
- "eval_recall": 0.8260869565217391,
8
- "eval_runtime": 6.7213,
9
  "eval_samples": 2001,
10
- "eval_samples_per_second": 297.711,
11
- "eval_steps_per_second": 37.344,
12
  "total_flos": 8817316923832968.0,
13
  "train_loss": 0.038693137679781234,
14
- "train_runtime": 671.6771,
15
  "train_samples": 12543,
16
- "train_samples_per_second": 373.483,
17
- "train_steps_per_second": 11.672
18
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 0.9840550320092251,
4
+ "eval_f1": 0.7979949874686717,
5
+ "eval_loss": 0.060650501400232315,
6
+ "eval_precision": 0.7735665694849369,
7
+ "eval_recall": 0.8240165631469979,
8
+ "eval_runtime": 2.1367,
9
  "eval_samples": 2001,
10
+ "eval_samples_per_second": 936.473,
11
+ "eval_steps_per_second": 29.484,
12
  "total_flos": 8817316923832968.0,
13
  "train_loss": 0.038693137679781234,
14
+ "train_runtime": 596.8038,
15
  "train_samples": 12543,
16
+ "train_samples_per_second": 420.339,
17
+ "train_steps_per_second": 13.137
18
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 0.9841743210465624,
4
- "eval_f1": 0.8008028098344204,
5
- "eval_loss": 0.06448859721422195,
6
- "eval_precision": 0.7770204479065238,
7
- "eval_recall": 0.8260869565217391,
8
- "eval_runtime": 6.7213,
9
  "eval_samples": 2001,
10
- "eval_samples_per_second": 297.711,
11
- "eval_steps_per_second": 37.344
12
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 0.9840550320092251,
4
+ "eval_f1": 0.7979949874686717,
5
+ "eval_loss": 0.060650501400232315,
6
+ "eval_precision": 0.7735665694849369,
7
+ "eval_recall": 0.8240165631469979,
8
+ "eval_runtime": 2.1367,
9
  "eval_samples": 2001,
10
+ "eval_samples_per_second": 936.473,
11
+ "eval_steps_per_second": 29.484
12
  }
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 20.0,
3
  "total_flos": 8817316923832968.0,
4
  "train_loss": 0.038693137679781234,
5
- "train_runtime": 671.6771,
6
  "train_samples": 12543,
7
- "train_samples_per_second": 373.483,
8
- "train_steps_per_second": 11.672
9
  }
 
2
  "epoch": 20.0,
3
  "total_flos": 8817316923832968.0,
4
  "train_loss": 0.038693137679781234,
5
+ "train_runtime": 596.8038,
6
  "train_samples": 12543,
7
+ "train_samples_per_second": 420.339,
8
+ "train_steps_per_second": 13.137
9
  }
trainer_state.json CHANGED
@@ -10,14 +10,14 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.9740745158853235,
14
- "eval_f1": 0.6371191135734072,
15
- "eval_loss": 0.09594480693340302,
16
- "eval_precision": 0.575,
17
  "eval_recall": 0.7142857142857143,
18
- "eval_runtime": 6.7658,
19
- "eval_samples_per_second": 295.753,
20
- "eval_steps_per_second": 37.099,
21
  "step": 392
22
  },
23
  {
@@ -29,14 +29,14 @@
29
  },
30
  {
31
  "epoch": 2.0,
32
- "eval_accuracy": 0.9798401526899678,
33
  "eval_f1": 0.7409200968523002,
34
- "eval_loss": 0.07035845518112183,
35
  "eval_precision": 0.6960873521383075,
36
  "eval_recall": 0.7919254658385093,
37
- "eval_runtime": 6.6994,
38
- "eval_samples_per_second": 298.683,
39
- "eval_steps_per_second": 37.466,
40
  "step": 784
41
  },
42
  {
@@ -48,14 +48,14 @@
48
  },
49
  {
50
  "epoch": 3.0,
51
- "eval_accuracy": 0.9814306731878008,
52
  "eval_f1": 0.7639691714836224,
53
- "eval_loss": 0.07102187722921371,
54
  "eval_precision": 0.7144144144144144,
55
  "eval_recall": 0.8209109730848861,
56
- "eval_runtime": 6.7074,
57
- "eval_samples_per_second": 298.328,
58
- "eval_steps_per_second": 37.421,
59
  "step": 1176
60
  },
61
  {
@@ -67,26 +67,26 @@
67
  },
68
  {
69
  "epoch": 4.0,
70
- "eval_accuracy": 0.9820668813869339,
71
  "eval_f1": 0.7654440154440154,
72
- "eval_loss": 0.06226913630962372,
73
  "eval_precision": 0.716998191681736,
74
  "eval_recall": 0.8209109730848861,
75
- "eval_runtime": 6.6379,
76
- "eval_samples_per_second": 301.45,
77
- "eval_steps_per_second": 37.813,
78
  "step": 1568
79
  },
80
  {
81
  "epoch": 5.0,
82
  "eval_accuracy": 0.9819873553620422,
83
  "eval_f1": 0.7762645914396887,
84
- "eval_loss": 0.06265858560800552,
85
  "eval_precision": 0.7321100917431193,
86
  "eval_recall": 0.8260869565217391,
87
- "eval_runtime": 6.7117,
88
- "eval_samples_per_second": 298.137,
89
- "eval_steps_per_second": 37.398,
90
  "step": 1960
91
  },
92
  {
@@ -98,14 +98,14 @@
98
  },
99
  {
100
  "epoch": 6.0,
101
- "eval_accuracy": 0.9826235635611754,
102
- "eval_f1": 0.7796278158667973,
103
- "eval_loss": 0.06144500896334648,
104
- "eval_precision": 0.7397769516728625,
105
- "eval_recall": 0.8240165631469979,
106
- "eval_runtime": 6.6293,
107
- "eval_samples_per_second": 301.841,
108
- "eval_steps_per_second": 37.862,
109
  "step": 2352
110
  },
111
  {
@@ -117,14 +117,14 @@
117
  },
118
  {
119
  "epoch": 7.0,
120
- "eval_accuracy": 0.9828621416358503,
121
  "eval_f1": 0.7857491459248416,
122
- "eval_loss": 0.06205696985125542,
123
  "eval_precision": 0.7433056325023084,
124
  "eval_recall": 0.8333333333333334,
125
- "eval_runtime": 6.7173,
126
- "eval_samples_per_second": 297.888,
127
- "eval_steps_per_second": 37.366,
128
  "step": 2744
129
  },
130
  {
@@ -136,14 +136,14 @@
136
  },
137
  {
138
  "epoch": 8.0,
139
- "eval_accuracy": 0.9846514771959124,
140
- "eval_f1": 0.8008008008008008,
141
- "eval_loss": 0.06194039061665535,
142
- "eval_precision": 0.7751937984496124,
143
  "eval_recall": 0.8281573498964804,
144
- "eval_runtime": 6.6418,
145
- "eval_samples_per_second": 301.272,
146
- "eval_steps_per_second": 37.791,
147
  "step": 3136
148
  },
149
  {
@@ -155,26 +155,26 @@
155
  },
156
  {
157
  "epoch": 9.0,
158
- "eval_accuracy": 0.9834188238100918,
159
- "eval_f1": 0.7904903417533433,
160
- "eval_loss": 0.06049573794007301,
161
- "eval_precision": 0.7578347578347578,
162
- "eval_recall": 0.8260869565217391,
163
- "eval_runtime": 6.7155,
164
- "eval_samples_per_second": 297.969,
165
- "eval_steps_per_second": 37.376,
166
  "step": 3528
167
  },
168
  {
169
  "epoch": 10.0,
170
- "eval_accuracy": 0.9848502922581415,
171
- "eval_f1": 0.804,
172
- "eval_loss": 0.05974126234650612,
173
- "eval_precision": 0.7775628626692457,
174
- "eval_recall": 0.8322981366459627,
175
- "eval_runtime": 6.7117,
176
- "eval_samples_per_second": 298.137,
177
- "eval_steps_per_second": 37.397,
178
  "step": 3920
179
  },
180
  {
@@ -187,13 +187,13 @@
187
  {
188
  "epoch": 11.0,
189
  "eval_accuracy": 0.9834983498349835,
190
- "eval_f1": 0.7948717948717949,
191
- "eval_loss": 0.05979320779442787,
192
- "eval_precision": 0.7589453860640302,
193
  "eval_recall": 0.8343685300207039,
194
- "eval_runtime": 6.6975,
195
- "eval_samples_per_second": 298.769,
196
- "eval_steps_per_second": 37.477,
197
  "step": 4312
198
  },
199
  {
@@ -205,14 +205,14 @@
205
  },
206
  {
207
  "epoch": 12.0,
208
- "eval_accuracy": 0.9841743210465624,
209
- "eval_f1": 0.798183652875883,
210
- "eval_loss": 0.06226903572678566,
211
- "eval_precision": 0.7785433070866141,
212
- "eval_recall": 0.8188405797101449,
213
- "eval_runtime": 6.6365,
214
- "eval_samples_per_second": 301.514,
215
- "eval_steps_per_second": 37.821,
216
  "step": 4704
217
  },
218
  {
@@ -224,26 +224,26 @@
224
  },
225
  {
226
  "epoch": 13.0,
227
- "eval_accuracy": 0.9844924251461291,
228
- "eval_f1": 0.8012078510317061,
229
- "eval_loss": 0.06113631650805473,
230
- "eval_precision": 0.7796278158667973,
231
  "eval_recall": 0.8240165631469979,
232
- "eval_runtime": 6.6332,
233
- "eval_samples_per_second": 301.666,
234
- "eval_steps_per_second": 37.84,
235
  "step": 5096
236
  },
237
  {
238
  "epoch": 14.0,
239
- "eval_accuracy": 0.9835381128474293,
240
- "eval_f1": 0.7942772570300938,
241
- "eval_loss": 0.06113998964428902,
242
- "eval_precision": 0.7587181903864278,
243
- "eval_recall": 0.8333333333333334,
244
- "eval_runtime": 6.6539,
245
- "eval_samples_per_second": 300.725,
246
- "eval_steps_per_second": 37.722,
247
  "step": 5488
248
  },
249
  {
@@ -255,14 +255,14 @@
255
  },
256
  {
257
  "epoch": 15.0,
258
- "eval_accuracy": 0.9844128991212374,
259
- "eval_f1": 0.8028098344204717,
260
- "eval_loss": 0.06239597126841545,
261
- "eval_precision": 0.7789678675754625,
262
  "eval_recall": 0.8281573498964804,
263
- "eval_runtime": 6.7198,
264
- "eval_samples_per_second": 297.776,
265
- "eval_steps_per_second": 37.352,
266
  "step": 5880
267
  },
268
  {
@@ -274,14 +274,14 @@
274
  },
275
  {
276
  "epoch": 16.0,
277
- "eval_accuracy": 0.9841345580341166,
278
- "eval_f1": 0.8019900497512437,
279
- "eval_loss": 0.06371314078569412,
280
- "eval_precision": 0.7720306513409961,
281
- "eval_recall": 0.8343685300207039,
282
- "eval_runtime": 6.6408,
283
- "eval_samples_per_second": 301.319,
284
- "eval_steps_per_second": 37.797,
285
  "step": 6272
286
  },
287
  {
@@ -293,14 +293,14 @@
293
  },
294
  {
295
  "epoch": 17.0,
296
- "eval_accuracy": 0.9839755059843334,
297
- "eval_f1": 0.8014042126379137,
298
- "eval_loss": 0.06424978375434875,
299
- "eval_precision": 0.7772373540856031,
300
- "eval_recall": 0.8271221532091098,
301
- "eval_runtime": 6.6399,
302
- "eval_samples_per_second": 301.361,
303
- "eval_steps_per_second": 37.802,
304
  "step": 6664
305
  },
306
  {
@@ -314,24 +314,24 @@
314
  "epoch": 18.0,
315
  "eval_accuracy": 0.9839755059843334,
316
  "eval_f1": 0.8004002001000501,
317
- "eval_loss": 0.06440357118844986,
318
  "eval_precision": 0.7744433688286544,
319
  "eval_recall": 0.8281573498964804,
320
- "eval_runtime": 6.7187,
321
- "eval_samples_per_second": 297.827,
322
- "eval_steps_per_second": 37.359,
323
  "step": 7056
324
  },
325
  {
326
  "epoch": 19.0,
327
- "eval_accuracy": 0.9842538470714541,
328
- "eval_f1": 0.8035982008995503,
329
- "eval_loss": 0.06508098542690277,
330
- "eval_precision": 0.7768115942028986,
331
- "eval_recall": 0.8322981366459627,
332
- "eval_runtime": 6.7259,
333
- "eval_samples_per_second": 297.506,
334
- "eval_steps_per_second": 37.318,
335
  "step": 7448
336
  },
337
  {
@@ -343,14 +343,14 @@
343
  },
344
  {
345
  "epoch": 20.0,
346
- "eval_accuracy": 0.9841743210465624,
347
- "eval_f1": 0.8008028098344204,
348
- "eval_loss": 0.06448859721422195,
349
- "eval_precision": 0.7770204479065238,
350
- "eval_recall": 0.8260869565217391,
351
- "eval_runtime": 6.703,
352
- "eval_samples_per_second": 298.525,
353
- "eval_steps_per_second": 37.446,
354
  "step": 7840
355
  },
356
  {
@@ -358,9 +358,9 @@
358
  "step": 7840,
359
  "total_flos": 8817316923832968.0,
360
  "train_loss": 0.038693137679781234,
361
- "train_runtime": 671.6771,
362
- "train_samples_per_second": 373.483,
363
- "train_steps_per_second": 11.672
364
  }
365
  ],
366
  "logging_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.973955226847986,
14
+ "eval_f1": 0.6374133949191687,
15
+ "eval_loss": 0.08990096300840378,
16
+ "eval_precision": 0.5754795663052544,
17
  "eval_recall": 0.7142857142857143,
18
+ "eval_runtime": 1.9571,
19
+ "eval_samples_per_second": 1022.422,
20
+ "eval_steps_per_second": 32.19,
21
  "step": 392
22
  },
23
  {
 
29
  },
30
  {
31
  "epoch": 2.0,
32
+ "eval_accuracy": 0.9798799157024136,
33
  "eval_f1": 0.7409200968523002,
34
+ "eval_loss": 0.06505557149648666,
35
  "eval_precision": 0.6960873521383075,
36
  "eval_recall": 0.7919254658385093,
37
+ "eval_runtime": 1.9464,
38
+ "eval_samples_per_second": 1028.043,
39
+ "eval_steps_per_second": 32.367,
40
  "step": 784
41
  },
42
  {
 
48
  },
49
  {
50
  "epoch": 3.0,
51
+ "eval_accuracy": 0.9814704362002465,
52
  "eval_f1": 0.7639691714836224,
53
+ "eval_loss": 0.06638560444116592,
54
  "eval_precision": 0.7144144144144144,
55
  "eval_recall": 0.8209109730848861,
56
+ "eval_runtime": 1.9458,
57
+ "eval_samples_per_second": 1028.343,
58
+ "eval_steps_per_second": 32.377,
59
  "step": 1176
60
  },
61
  {
 
67
  },
68
  {
69
  "epoch": 4.0,
70
+ "eval_accuracy": 0.9821464074118256,
71
  "eval_f1": 0.7654440154440154,
72
+ "eval_loss": 0.05806884169578552,
73
  "eval_precision": 0.716998191681736,
74
  "eval_recall": 0.8209109730848861,
75
+ "eval_runtime": 1.9555,
76
+ "eval_samples_per_second": 1023.292,
77
+ "eval_steps_per_second": 32.218,
78
  "step": 1568
79
  },
80
  {
81
  "epoch": 5.0,
82
  "eval_accuracy": 0.9819873553620422,
83
  "eval_f1": 0.7762645914396887,
84
+ "eval_loss": 0.05841425433754921,
85
  "eval_precision": 0.7321100917431193,
86
  "eval_recall": 0.8260869565217391,
87
+ "eval_runtime": 1.9706,
88
+ "eval_samples_per_second": 1015.404,
89
+ "eval_steps_per_second": 31.969,
90
  "step": 1960
91
  },
92
  {
 
98
  },
99
  {
100
  "epoch": 6.0,
101
+ "eval_accuracy": 0.9826633265736212,
102
+ "eval_f1": 0.7797940166748406,
103
+ "eval_loss": 0.05712873861193657,
104
+ "eval_precision": 0.7409133271202236,
105
+ "eval_recall": 0.8229813664596274,
106
+ "eval_runtime": 1.977,
107
+ "eval_samples_per_second": 1012.156,
108
+ "eval_steps_per_second": 31.867,
109
  "step": 2352
110
  },
111
  {
 
117
  },
118
  {
119
  "epoch": 7.0,
120
+ "eval_accuracy": 0.9829019046482962,
121
  "eval_f1": 0.7857491459248416,
122
+ "eval_loss": 0.05804689601063728,
123
  "eval_precision": 0.7433056325023084,
124
  "eval_recall": 0.8333333333333334,
125
+ "eval_runtime": 1.9531,
126
+ "eval_samples_per_second": 1024.51,
127
+ "eval_steps_per_second": 32.256,
128
  "step": 2744
129
  },
130
  {
 
136
  },
137
  {
138
  "epoch": 8.0,
139
+ "eval_accuracy": 0.9846117141834665,
140
+ "eval_f1": 0.8004002001000501,
141
+ "eval_loss": 0.05779951810836792,
142
+ "eval_precision": 0.7744433688286544,
143
  "eval_recall": 0.8281573498964804,
144
+ "eval_runtime": 1.9641,
145
+ "eval_samples_per_second": 1018.804,
146
+ "eval_steps_per_second": 32.076,
147
  "step": 3136
148
  },
149
  {
 
155
  },
156
  {
157
  "epoch": 9.0,
158
+ "eval_accuracy": 0.9834585868225377,
159
+ "eval_f1": 0.7914809311540367,
160
+ "eval_loss": 0.056642863899469376,
161
+ "eval_precision": 0.7587844254510921,
162
+ "eval_recall": 0.8271221532091098,
163
+ "eval_runtime": 1.9436,
164
+ "eval_samples_per_second": 1029.513,
165
+ "eval_steps_per_second": 32.413,
166
  "step": 3528
167
  },
168
  {
169
  "epoch": 10.0,
170
+ "eval_accuracy": 0.9847707662332499,
171
+ "eval_f1": 0.8019999999999999,
172
+ "eval_loss": 0.05644238740205765,
173
+ "eval_precision": 0.7756286266924565,
174
+ "eval_recall": 0.8302277432712215,
175
+ "eval_runtime": 1.9568,
176
+ "eval_samples_per_second": 1022.58,
177
+ "eval_steps_per_second": 32.195,
178
  "step": 3920
179
  },
180
  {
 
187
  {
188
  "epoch": 11.0,
189
  "eval_accuracy": 0.9834983498349835,
190
+ "eval_f1": 0.7952639368524913,
191
+ "eval_loss": 0.05572296306490898,
192
+ "eval_precision": 0.7596606974552309,
193
  "eval_recall": 0.8343685300207039,
194
+ "eval_runtime": 1.9713,
195
+ "eval_samples_per_second": 1015.086,
196
+ "eval_steps_per_second": 31.959,
197
  "step": 4312
198
  },
199
  {
 
205
  },
206
  {
207
  "epoch": 12.0,
208
+ "eval_accuracy": 0.9840550320092251,
209
+ "eval_f1": 0.7967644084934277,
210
+ "eval_loss": 0.05849658325314522,
211
+ "eval_precision": 0.7786561264822134,
212
+ "eval_recall": 0.8157349896480331,
213
+ "eval_runtime": 1.9705,
214
+ "eval_samples_per_second": 1015.502,
215
+ "eval_steps_per_second": 31.972,
216
  "step": 4704
217
  },
218
  {
 
224
  },
225
  {
226
  "epoch": 13.0,
227
+ "eval_accuracy": 0.9845321881585749,
228
+ "eval_f1": 0.802015113350126,
229
+ "eval_loss": 0.05740697309374809,
230
+ "eval_precision": 0.7811579980372915,
231
  "eval_recall": 0.8240165631469979,
232
+ "eval_runtime": 1.9671,
233
+ "eval_samples_per_second": 1017.255,
234
+ "eval_steps_per_second": 32.028,
235
  "step": 5096
236
  },
237
  {
238
  "epoch": 14.0,
239
+ "eval_accuracy": 0.983617638872321,
240
+ "eval_f1": 0.7956564659427443,
241
+ "eval_loss": 0.0576859749853611,
242
+ "eval_precision": 0.7603773584905661,
243
+ "eval_recall": 0.8343685300207039,
244
+ "eval_runtime": 1.9779,
245
+ "eval_samples_per_second": 1011.701,
246
+ "eval_steps_per_second": 31.853,
247
  "step": 5488
248
  },
249
  {
 
255
  },
256
  {
257
  "epoch": 15.0,
258
+ "eval_accuracy": 0.9845321881585749,
259
+ "eval_f1": 0.8040201005025126,
260
+ "eval_loss": 0.058342624455690384,
261
+ "eval_precision": 0.78125,
262
  "eval_recall": 0.8281573498964804,
263
+ "eval_runtime": 1.9542,
264
+ "eval_samples_per_second": 1023.925,
265
+ "eval_steps_per_second": 32.238,
266
  "step": 5880
267
  },
268
  {
 
274
  },
275
  {
276
  "epoch": 16.0,
277
+ "eval_accuracy": 0.9840947950216709,
278
+ "eval_f1": 0.802192326856004,
279
+ "eval_loss": 0.05951229855418205,
280
+ "eval_precision": 0.7732949087415946,
281
+ "eval_recall": 0.8333333333333334,
282
+ "eval_runtime": 1.9485,
283
+ "eval_samples_per_second": 1026.943,
284
+ "eval_steps_per_second": 32.333,
285
  "step": 6272
286
  },
287
  {
 
293
  },
294
  {
295
  "epoch": 17.0,
296
+ "eval_accuracy": 0.9839357429718876,
297
+ "eval_f1": 0.8,
298
+ "eval_loss": 0.06028683856129646,
299
+ "eval_precision": 0.7755102040816326,
300
+ "eval_recall": 0.8260869565217391,
301
+ "eval_runtime": 1.9515,
302
+ "eval_samples_per_second": 1025.339,
303
+ "eval_steps_per_second": 32.282,
304
  "step": 6664
305
  },
306
  {
 
314
  "epoch": 18.0,
315
  "eval_accuracy": 0.9839755059843334,
316
  "eval_f1": 0.8004002001000501,
317
+ "eval_loss": 0.06049268692731857,
318
  "eval_precision": 0.7744433688286544,
319
  "eval_recall": 0.8281573498964804,
320
+ "eval_runtime": 1.9474,
321
+ "eval_samples_per_second": 1027.524,
322
+ "eval_steps_per_second": 32.351,
323
  "step": 7056
324
  },
325
  {
326
  "epoch": 19.0,
327
+ "eval_accuracy": 0.9841743210465624,
328
+ "eval_f1": 0.8041958041958043,
329
+ "eval_loss": 0.06108159199357033,
330
+ "eval_precision": 0.777027027027027,
331
+ "eval_recall": 0.8333333333333334,
332
+ "eval_runtime": 1.9732,
333
+ "eval_samples_per_second": 1014.065,
334
+ "eval_steps_per_second": 31.927,
335
  "step": 7448
336
  },
337
  {
 
343
  },
344
  {
345
  "epoch": 20.0,
346
+ "eval_accuracy": 0.9840550320092251,
347
+ "eval_f1": 0.7979949874686717,
348
+ "eval_loss": 0.060650501400232315,
349
+ "eval_precision": 0.7735665694849369,
350
+ "eval_recall": 0.8240165631469979,
351
+ "eval_runtime": 1.9653,
352
+ "eval_samples_per_second": 1018.178,
353
+ "eval_steps_per_second": 32.057,
354
  "step": 7840
355
  },
356
  {
 
358
  "step": 7840,
359
  "total_flos": 8817316923832968.0,
360
  "train_loss": 0.038693137679781234,
361
+ "train_runtime": 596.8038,
362
+ "train_samples_per_second": 420.339,
363
+ "train_steps_per_second": 13.137
364
  }
365
  ],
366
  "logging_steps": 500,