Theoreticallyhugo commited on
Commit
66a7884
1 Parent(s): 0d6953b

Training in progress, epoch 12, checkpoint

Browse files
checkpoint-492/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ca4cfb367f9aeeb0da772b83231edbb93b79495a8028e61b5d39421973f2356
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bdb1250456b729b97b1c9e4a7becd50207d1e640f6540c6acf8c69b9548c993
3
  size 592330980
checkpoint-492/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42d9ff8c975b2985474bb8a840f98d2905fb92836d9ef91e7d06d5d657015a43
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fb584edc1d9d30ce56cfecb0c407351f6a35ee1cf1a8b44365474b46dc9fe29
3
  size 1014670074
checkpoint-492/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6e53e706c63ba0c275c9b6332ceadb76c337b40858f3ddadb0ab10622a334eb
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c189466643703424c77db24cb1c70bb1b76b65752ddeeaa3d7bb424b6ea3dcb
3
  size 14244
checkpoint-492/trainer_state.json CHANGED
@@ -14,753 +14,753 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 339.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 160.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.7931404072883173,
27
- "precision": 0.8,
28
- "recall": 0.7863974495217854,
29
- "support": 941.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.40067911714770804,
33
- "precision": 0.46561443066516345,
34
- "recall": 0.35163899531715626,
35
- "support": 4698.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.5607655502392344,
39
- "precision": 0.4144271570014144,
40
- "recall": 0.8668639053254438,
41
- "support": 2028.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8556539864512767,
45
- "precision": 0.8844441252513645,
46
- "recall": 0.8286790929277976,
47
- "support": 14861.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.9839078762825717,
51
- "precision": 0.9700167382286587,
52
- "recall": 0.9982026510896428,
53
- "support": 13353.0
54
  },
55
- "eval_accuracy": 0.8189664650907091,
56
- "eval_loss": 0.4724249243736267,
57
  "eval_macro avg": {
58
- "f1-score": 0.5134495624870155,
59
- "precision": 0.5049289215923716,
60
- "recall": 0.5473974420259752,
61
- "support": 36380.0
62
- },
63
- "eval_runtime": 1.4721,
64
- "eval_samples_per_second": 55.025,
65
- "eval_steps_per_second": 7.473,
66
  "eval_weighted avg": {
67
- "f1-score": 0.8141826255128369,
68
- "precision": 0.8212499318469384,
69
- "recall": 0.8189664650907091,
70
- "support": 36380.0
71
  },
72
  "step": 41
73
  },
74
  {
75
  "epoch": 2.0,
76
  "eval_B-Claim": {
77
- "f1-score": 0.33835845896147404,
78
- "precision": 0.39147286821705424,
79
- "recall": 0.29793510324483774,
80
- "support": 339.0
81
  },
82
  "eval_B-MajorClaim": {
83
- "f1-score": 0.02469135802469136,
84
- "precision": 1.0,
85
- "recall": 0.0125,
86
- "support": 160.0
87
  },
88
  "eval_B-Premise": {
89
- "f1-score": 0.8715509039010466,
90
- "precision": 0.788975021533161,
91
- "recall": 0.973432518597237,
92
- "support": 941.0
93
  },
94
  "eval_I-Claim": {
95
- "f1-score": 0.5235237638022083,
96
- "precision": 0.6001651073197578,
97
- "recall": 0.46424010217113665,
98
- "support": 4698.0
99
  },
100
  "eval_I-MajorClaim": {
101
- "f1-score": 0.7519225291939617,
102
- "precision": 0.890087660148348,
103
- "recall": 0.650887573964497,
104
- "support": 2028.0
105
  },
106
  "eval_I-Premise": {
107
- "f1-score": 0.8986994772408516,
108
- "precision": 0.8537944400702562,
109
- "recall": 0.9485902698337931,
110
- "support": 14861.0
111
  },
112
  "eval_O": {
113
- "f1-score": 0.9990256333383302,
114
- "precision": 0.9998499737454054,
115
- "recall": 0.9982026510896428,
116
- "support": 13353.0
117
  },
118
- "eval_accuracy": 0.8781198460692689,
119
- "eval_loss": 0.2805784344673157,
120
  "eval_macro avg": {
121
- "f1-score": 0.6296817320660805,
122
- "precision": 0.7891921530048547,
123
- "recall": 0.6208268884144491,
124
- "support": 36380.0
125
- },
126
- "eval_runtime": 1.474,
127
- "eval_samples_per_second": 54.951,
128
- "eval_steps_per_second": 7.463,
129
  "eval_weighted avg": {
130
- "f1-score": 0.8691247740581066,
131
- "precision": 0.871331614069924,
132
- "recall": 0.8781198460692689,
133
- "support": 36380.0
134
  },
135
  "step": 82
136
  },
137
  {
138
  "epoch": 3.0,
139
  "eval_B-Claim": {
140
- "f1-score": 0.523191094619666,
141
- "precision": 0.705,
142
- "recall": 0.415929203539823,
143
- "support": 339.0
144
  },
145
  "eval_B-MajorClaim": {
146
- "f1-score": 0.8686868686868686,
147
- "precision": 0.9416058394160584,
148
- "recall": 0.80625,
149
- "support": 160.0
150
  },
151
  "eval_B-Premise": {
152
- "f1-score": 0.888997555012225,
153
- "precision": 0.8233695652173914,
154
- "recall": 0.9659936238044633,
155
- "support": 941.0
156
  },
157
  "eval_I-Claim": {
158
- "f1-score": 0.5733916302311056,
159
- "precision": 0.6939824614454189,
160
- "recall": 0.4885057471264368,
161
- "support": 4698.0
162
  },
163
  "eval_I-MajorClaim": {
164
- "f1-score": 0.883077696756349,
165
- "precision": 0.900974858902001,
166
- "recall": 0.8658777120315582,
167
- "support": 2028.0
168
  },
169
  "eval_I-Premise": {
170
- "f1-score": 0.9034677264277932,
171
- "precision": 0.862554311241662,
172
- "recall": 0.9484556893883319,
173
- "support": 14861.0
174
  },
175
  "eval_O": {
176
- "f1-score": 0.9993631766248362,
177
- "precision": 0.9997751461549993,
178
- "recall": 0.9989515464689583,
179
- "support": 13353.0
180
  },
181
- "eval_accuracy": 0.8978559648158329,
182
- "eval_loss": 0.2462552785873413,
183
  "eval_macro avg": {
184
- "f1-score": 0.8057393926226919,
185
- "precision": 0.8467517403396473,
186
- "recall": 0.7842805031942245,
187
- "support": 36380.0
188
- },
189
- "eval_runtime": 1.4759,
190
- "eval_samples_per_second": 54.882,
191
- "eval_steps_per_second": 7.453,
192
  "eval_weighted avg": {
193
- "f1-score": 0.8908329908492291,
194
- "precision": 0.8911590560437058,
195
- "recall": 0.8978559648158329,
196
- "support": 36380.0
197
  },
198
  "step": 123
199
  },
200
  {
201
  "epoch": 4.0,
202
  "eval_B-Claim": {
203
- "f1-score": 0.5845070422535211,
204
- "precision": 0.7248908296943232,
205
- "recall": 0.4896755162241888,
206
- "support": 339.0
207
  },
208
  "eval_B-MajorClaim": {
209
- "f1-score": 0.8762541806020067,
210
- "precision": 0.9424460431654677,
211
- "recall": 0.81875,
212
- "support": 160.0
213
  },
214
  "eval_B-Premise": {
215
- "f1-score": 0.8968253968253969,
216
- "precision": 0.8409302325581396,
217
- "recall": 0.9606801275239107,
218
- "support": 941.0
219
  },
220
  "eval_I-Claim": {
221
- "f1-score": 0.5514666666666667,
222
- "precision": 0.7380442541042113,
223
- "recall": 0.44018731375053216,
224
- "support": 4698.0
225
  },
226
  "eval_I-MajorClaim": {
227
- "f1-score": 0.8924440068914595,
228
- "precision": 0.8909090909090909,
229
- "recall": 0.8939842209072978,
230
- "support": 2028.0
231
  },
232
  "eval_I-Premise": {
233
- "f1-score": 0.9053656685743194,
234
- "precision": 0.8539305737802696,
235
- "recall": 0.9633941188345333,
236
- "support": 14861.0
237
  },
238
  "eval_O": {
239
- "f1-score": 0.9991381571551693,
240
- "precision": 0.999850007499625,
241
- "recall": 0.9984273197034375,
242
- "support": 13353.0
243
  },
244
- "eval_accuracy": 0.8996976360637713,
245
- "eval_loss": 0.24545952677726746,
246
  "eval_macro avg": {
247
- "f1-score": 0.8151430169955056,
248
- "precision": 0.8558572902444468,
249
- "recall": 0.7950140881348429,
250
- "support": 36380.0
251
- },
252
- "eval_runtime": 1.4673,
253
- "eval_samples_per_second": 55.203,
254
- "eval_steps_per_second": 7.497,
255
  "eval_weighted avg": {
256
- "f1-score": 0.8900236150023304,
257
- "precision": 0.8934359443718076,
258
- "recall": 0.8996976360637713,
259
- "support": 36380.0
260
  },
261
  "step": 164
262
  },
263
  {
264
  "epoch": 5.0,
265
  "eval_B-Claim": {
266
- "f1-score": 0.6523887973640857,
267
- "precision": 0.7388059701492538,
268
- "recall": 0.584070796460177,
269
- "support": 339.0
270
  },
271
  "eval_B-MajorClaim": {
272
- "f1-score": 0.888888888888889,
273
- "precision": 0.9315068493150684,
274
- "recall": 0.85,
275
- "support": 160.0
276
  },
277
  "eval_B-Premise": {
278
- "f1-score": 0.9065040650406505,
279
- "precision": 0.8685491723466408,
280
- "recall": 0.9479277364505845,
281
- "support": 941.0
282
  },
283
  "eval_I-Claim": {
284
- "f1-score": 0.6614963503649636,
285
- "precision": 0.7125307125307125,
286
- "recall": 0.6172839506172839,
287
- "support": 4698.0
288
  },
289
  "eval_I-MajorClaim": {
290
- "f1-score": 0.8936275725266551,
291
- "precision": 0.8987531172069826,
292
- "recall": 0.888560157790927,
293
- "support": 2028.0
294
  },
295
  "eval_I-Premise": {
296
- "f1-score": 0.9151582965839531,
297
- "precision": 0.8955877616747182,
298
- "recall": 0.9356032568467801,
299
- "support": 14861.0
300
  },
301
  "eval_O": {
302
- "f1-score": 0.9985763524651581,
303
- "precision": 0.9991003823375065,
304
- "recall": 0.9980528720137797,
305
- "support": 13353.0
306
  },
307
- "eval_accuracy": 0.9114623419461243,
308
- "eval_loss": 0.2526456117630005,
309
  "eval_macro avg": {
310
- "f1-score": 0.8452343318906221,
311
- "precision": 0.8635477093658405,
312
- "recall": 0.8316426814542189,
313
- "support": 36380.0
314
- },
315
- "eval_runtime": 1.4686,
316
- "eval_samples_per_second": 55.156,
317
- "eval_steps_per_second": 7.49,
318
  "eval_weighted avg": {
319
- "f1-score": 0.9090309620899378,
320
- "precision": 0.9081159656876019,
321
- "recall": 0.9114623419461243,
322
- "support": 36380.0
323
  },
324
  "step": 205
325
  },
326
  {
327
  "epoch": 6.0,
328
  "eval_B-Claim": {
329
- "f1-score": 0.6990881458966565,
330
- "precision": 0.7210031347962382,
331
- "recall": 0.6784660766961652,
332
- "support": 339.0
333
  },
334
  "eval_B-MajorClaim": {
335
- "f1-score": 0.9221183800623053,
336
- "precision": 0.9192546583850931,
337
- "recall": 0.925,
338
- "support": 160.0
339
  },
340
  "eval_B-Premise": {
341
- "f1-score": 0.9045120671563485,
342
- "precision": 0.8932642487046633,
343
- "recall": 0.9160467587672688,
344
- "support": 941.0
345
  },
346
  "eval_I-Claim": {
347
- "f1-score": 0.6783031374281926,
348
- "precision": 0.7050987597611392,
349
- "recall": 0.6534695615155385,
350
- "support": 4698.0
351
  },
352
  "eval_I-MajorClaim": {
353
- "f1-score": 0.9009445386292081,
354
- "precision": 0.8852927177534508,
355
- "recall": 0.9171597633136095,
356
- "support": 2028.0
357
  },
358
  "eval_I-Premise": {
359
- "f1-score": 0.9145196724585581,
360
- "precision": 0.904881101376721,
361
- "recall": 0.9243657896507638,
362
- "support": 14861.0
363
  },
364
  "eval_O": {
365
- "f1-score": 0.9976737205463005,
366
- "precision": 0.9996992255056771,
367
- "recall": 0.99565640679997,
368
- "support": 13353.0
369
  },
370
- "eval_accuracy": 0.9126443100604728,
371
- "eval_loss": 0.26729828119277954,
372
  "eval_macro avg": {
373
- "f1-score": 0.8595942374539386,
374
- "precision": 0.8612134066118546,
375
- "recall": 0.8585949081061879,
376
- "support": 36380.0
377
- },
378
- "eval_runtime": 1.4686,
379
- "eval_samples_per_second": 55.156,
380
- "eval_steps_per_second": 7.49,
381
  "eval_weighted avg": {
382
- "f1-score": 0.9115468219984093,
383
- "precision": 0.9108414479595167,
384
- "recall": 0.9126443100604728,
385
- "support": 36380.0
386
  },
387
  "step": 246
388
  },
389
  {
390
  "epoch": 7.0,
391
  "eval_B-Claim": {
392
- "f1-score": 0.5932504440497335,
393
- "precision": 0.7455357142857143,
394
- "recall": 0.49262536873156343,
395
- "support": 339.0
396
  },
397
  "eval_B-MajorClaim": {
398
- "f1-score": 0.919093851132686,
399
- "precision": 0.9530201342281879,
400
- "recall": 0.8875,
401
- "support": 160.0
402
  },
403
  "eval_B-Premise": {
404
- "f1-score": 0.8955223880597015,
405
- "precision": 0.8419083255378859,
406
- "recall": 0.9564293304994687,
407
- "support": 941.0
408
  },
409
  "eval_I-Claim": {
410
- "f1-score": 0.5761658031088083,
411
- "precision": 0.7359364659166115,
412
- "recall": 0.4733929331630481,
413
- "support": 4698.0
414
  },
415
  "eval_I-MajorClaim": {
416
- "f1-score": 0.9135680866781581,
417
- "precision": 0.912444663059518,
418
- "recall": 0.9146942800788954,
419
- "support": 2028.0
420
  },
421
  "eval_I-Premise": {
422
- "f1-score": 0.9047619047619048,
423
- "precision": 0.8574441164065795,
424
- "recall": 0.9576071596796986,
425
- "support": 14861.0
426
  },
427
  "eval_O": {
428
- "f1-score": 0.9972596568940275,
429
- "precision": 0.9997741984043353,
430
- "recall": 0.9947577323447915,
431
- "support": 13353.0
432
  },
433
- "eval_accuracy": 0.9016492578339748,
434
- "eval_loss": 0.3082038462162018,
435
  "eval_macro avg": {
436
- "f1-score": 0.8285174478121456,
437
- "precision": 0.8637233739769761,
438
- "recall": 0.8110009720710665,
439
- "support": 36380.0
440
- },
441
- "eval_runtime": 1.471,
442
- "eval_samples_per_second": 55.064,
443
- "eval_steps_per_second": 7.478,
444
  "eval_weighted avg": {
445
- "f1-score": 0.8936908018647435,
446
- "precision": 0.8960358642584588,
447
- "recall": 0.9016492578339748,
448
- "support": 36380.0
449
  },
450
  "step": 287
451
  },
452
  {
453
  "epoch": 8.0,
454
  "eval_B-Claim": {
455
- "f1-score": 0.6687598116169545,
456
- "precision": 0.714765100671141,
457
- "recall": 0.6283185840707964,
458
- "support": 339.0
459
  },
460
  "eval_B-MajorClaim": {
461
- "f1-score": 0.9006622516556291,
462
- "precision": 0.9577464788732394,
463
- "recall": 0.85,
464
- "support": 160.0
465
  },
466
  "eval_B-Premise": {
467
- "f1-score": 0.9037570766855377,
468
- "precision": 0.8762475049900199,
469
- "recall": 0.9330499468650372,
470
- "support": 941.0
471
  },
472
  "eval_I-Claim": {
473
- "f1-score": 0.6700325367440816,
474
- "precision": 0.7084223013048636,
475
- "recall": 0.6355896126011068,
476
- "support": 4698.0
477
  },
478
  "eval_I-MajorClaim": {
479
- "f1-score": 0.9144028703229115,
480
- "precision": 0.951974386339381,
481
- "recall": 0.8796844181459567,
482
- "support": 2028.0
483
  },
484
  "eval_I-Premise": {
485
- "f1-score": 0.9123429999342408,
486
- "precision": 0.8920465505047258,
487
- "recall": 0.9335845501648611,
488
- "support": 14861.0
489
  },
490
  "eval_O": {
491
- "f1-score": 0.9972606852039475,
492
- "precision": 0.9993983152827918,
493
- "recall": 0.9951321800344491,
494
- "support": 13353.0
495
  },
496
- "eval_accuracy": 0.9114623419461243,
497
- "eval_loss": 0.3109261393547058,
498
  "eval_macro avg": {
499
- "f1-score": 0.8524597474519003,
500
- "precision": 0.8715143768523089,
501
- "recall": 0.8364798988403154,
502
- "support": 36380.0
503
- },
504
- "eval_runtime": 1.4725,
505
- "eval_samples_per_second": 55.007,
506
- "eval_steps_per_second": 7.47,
507
  "eval_weighted avg": {
508
- "f1-score": 0.9097917557931217,
509
- "precision": 0.9093055312257066,
510
- "recall": 0.9114623419461243,
511
- "support": 36380.0
512
  },
513
  "step": 328
514
  },
515
  {
516
  "epoch": 9.0,
517
  "eval_B-Claim": {
518
- "f1-score": 0.6548956661316213,
519
- "precision": 0.7183098591549296,
520
- "recall": 0.6017699115044248,
521
- "support": 339.0
522
  },
523
  "eval_B-MajorClaim": {
524
- "f1-score": 0.9049180327868853,
525
- "precision": 0.9517241379310345,
526
- "recall": 0.8625,
527
- "support": 160.0
528
  },
529
  "eval_B-Premise": {
530
- "f1-score": 0.9022017409114182,
531
- "precision": 0.8705533596837944,
532
- "recall": 0.9362380446333688,
533
- "support": 941.0
534
  },
535
  "eval_I-Claim": {
536
- "f1-score": 0.6574490148634635,
537
- "precision": 0.7166541070082894,
538
- "recall": 0.60727969348659,
539
- "support": 4698.0
540
  },
541
  "eval_I-MajorClaim": {
542
- "f1-score": 0.9180990899898889,
543
- "precision": 0.941908713692946,
544
- "recall": 0.8954635108481263,
545
- "support": 2028.0
546
  },
547
  "eval_I-Premise": {
548
- "f1-score": 0.9119628491072013,
549
- "precision": 0.8871285868804479,
550
- "recall": 0.938227575533275,
551
- "support": 14861.0
552
  },
553
  "eval_O": {
554
- "f1-score": 0.9979749493737343,
555
- "precision": 0.9994741981521821,
556
- "recall": 0.9964801917172171,
557
- "support": 13353.0
558
  },
559
- "eval_accuracy": 0.9109675645959319,
560
- "eval_loss": 0.3515395522117615,
561
  "eval_macro avg": {
562
- "f1-score": 0.8496430490234591,
563
- "precision": 0.8693932803576605,
564
- "recall": 0.8339941325318574,
565
- "support": 36380.0
566
- },
567
- "eval_runtime": 1.4698,
568
- "eval_samples_per_second": 55.111,
569
- "eval_steps_per_second": 7.484,
570
  "eval_weighted avg": {
571
- "f1-score": 0.908328976914783,
572
- "precision": 0.9076856069113689,
573
- "recall": 0.9109675645959319,
574
- "support": 36380.0
575
  },
576
  "step": 369
577
  },
578
  {
579
  "epoch": 10.0,
580
  "eval_B-Claim": {
581
- "f1-score": 0.6687697160883281,
582
- "precision": 0.7186440677966102,
583
- "recall": 0.6253687315634219,
584
- "support": 339.0
585
  },
586
  "eval_B-MajorClaim": {
587
- "f1-score": 0.9131832797427653,
588
- "precision": 0.9403973509933775,
589
- "recall": 0.8875,
590
- "support": 160.0
591
  },
592
  "eval_B-Premise": {
593
- "f1-score": 0.9038262668045501,
594
- "precision": 0.8801611278952669,
595
- "recall": 0.9287991498405951,
596
- "support": 941.0
597
  },
598
  "eval_I-Claim": {
599
- "f1-score": 0.6525114155251142,
600
- "precision": 0.7035942885278188,
601
- "recall": 0.6083439761600681,
602
- "support": 4698.0
603
  },
604
  "eval_I-MajorClaim": {
605
- "f1-score": 0.913640824337586,
606
- "precision": 0.9091796875,
607
- "recall": 0.9181459566074951,
608
- "support": 2028.0
609
  },
610
  "eval_I-Premise": {
611
- "f1-score": 0.909934821252222,
612
- "precision": 0.8907005220081201,
613
- "recall": 0.9300181683601373,
614
- "support": 14861.0
615
  },
616
  "eval_O": {
617
- "f1-score": 0.9979375257809279,
618
- "precision": 0.9993991287366681,
619
- "recall": 0.9964801917172171,
620
- "support": 13353.0
621
  },
622
- "eval_accuracy": 0.9091533809785597,
623
- "eval_loss": 0.36655083298683167,
624
  "eval_macro avg": {
625
- "f1-score": 0.8514005499330703,
626
- "precision": 0.8631537390654088,
627
- "recall": 0.8420937391784192,
628
- "support": 36380.0
629
- },
630
- "eval_runtime": 1.4773,
631
- "eval_samples_per_second": 54.829,
632
- "eval_steps_per_second": 7.446,
633
  "eval_weighted avg": {
634
- "f1-score": 0.9068083056033942,
635
- "precision": 0.9058079970815979,
636
- "recall": 0.9091533809785597,
637
- "support": 36380.0
638
  },
639
  "step": 410
640
  },
641
  {
642
  "epoch": 11.0,
643
  "eval_B-Claim": {
644
- "f1-score": 0.6924265842349304,
645
- "precision": 0.7272727272727273,
646
- "recall": 0.6607669616519174,
647
- "support": 339.0
648
  },
649
  "eval_B-MajorClaim": {
650
- "f1-score": 0.9345794392523364,
651
- "precision": 0.9316770186335404,
652
- "recall": 0.9375,
653
- "support": 160.0
654
  },
655
  "eval_B-Premise": {
656
- "f1-score": 0.9049111807732496,
657
- "precision": 0.8900308324768756,
658
- "recall": 0.9202975557917109,
659
- "support": 941.0
660
  },
661
  "eval_I-Claim": {
662
- "f1-score": 0.6834684134562007,
663
- "precision": 0.7143188674866559,
664
- "recall": 0.6551724137931034,
665
- "support": 4698.0
666
  },
667
  "eval_I-MajorClaim": {
668
- "f1-score": 0.9320293398533007,
669
- "precision": 0.9243452958292919,
670
- "recall": 0.9398422090729783,
671
- "support": 2028.0
672
  },
673
  "eval_I-Premise": {
674
- "f1-score": 0.9131185652607107,
675
- "precision": 0.9015017378188733,
676
- "recall": 0.9250386918780701,
677
- "support": 14861.0
678
  },
679
  "eval_O": {
680
- "f1-score": 0.9980128229162761,
681
- "precision": 0.9993242228562847,
682
- "recall": 0.9967048603310118,
683
- "support": 13353.0
684
  },
685
- "eval_accuracy": 0.9147883452446399,
686
- "eval_loss": 0.3872090280056,
687
  "eval_macro avg": {
688
- "f1-score": 0.8655066208210008,
689
- "precision": 0.8697815289106071,
690
- "recall": 0.8621889560741132,
691
- "support": 36380.0
692
- },
693
- "eval_runtime": 1.4746,
694
- "eval_samples_per_second": 54.93,
695
- "eval_steps_per_second": 7.46,
696
  "eval_weighted avg": {
697
- "f1-score": 0.9135018437004899,
698
- "precision": 0.9127204168171501,
699
- "recall": 0.9147883452446399,
700
- "support": 36380.0
701
  },
702
  "step": 451
703
  },
704
  {
705
  "epoch": 12.0,
706
  "eval_B-Claim": {
707
- "f1-score": 0.6677631578947368,
708
- "precision": 0.7546468401486989,
709
- "recall": 0.5988200589970502,
710
- "support": 339.0
711
  },
712
  "eval_B-MajorClaim": {
713
- "f1-score": 0.9411764705882352,
714
- "precision": 0.9325153374233128,
715
- "recall": 0.95,
716
- "support": 160.0
717
  },
718
  "eval_B-Premise": {
719
- "f1-score": 0.9050795279630579,
720
- "precision": 0.875,
721
- "recall": 0.9373007438894793,
722
- "support": 941.0
723
  },
724
  "eval_I-Claim": {
725
- "f1-score": 0.6464068644976761,
726
- "precision": 0.7343623070674249,
727
- "recall": 0.5772669220945083,
728
- "support": 4698.0
729
  },
730
  "eval_I-MajorClaim": {
731
- "f1-score": 0.9218900675024109,
732
- "precision": 0.9018867924528302,
733
- "recall": 0.9428007889546351,
734
- "support": 2028.0
735
  },
736
  "eval_I-Premise": {
737
- "f1-score": 0.9120062573328118,
738
- "precision": 0.8842823737597169,
739
- "recall": 0.9415247964470762,
740
- "support": 14861.0
741
  },
742
  "eval_O": {
743
- "f1-score": 0.997411561691113,
744
- "precision": 0.9992483463619964,
745
- "recall": 0.9955815172620385,
746
- "support": 13353.0
747
  },
748
- "eval_accuracy": 0.9111324903793293,
749
- "eval_loss": 0.46548593044281006,
750
  "eval_macro avg": {
751
- "f1-score": 0.8559619867814344,
752
- "precision": 0.8688488567448543,
753
- "recall": 0.8490421182349696,
754
- "support": 36380.0
755
- },
756
- "eval_runtime": 1.4688,
757
- "eval_samples_per_second": 55.148,
758
- "eval_steps_per_second": 7.489,
759
  "eval_weighted avg": {
760
- "f1-score": 0.907279105591616,
761
- "precision": 0.9068649475511307,
762
- "recall": 0.9111324903793293,
763
- "support": 36380.0
764
  },
765
  "step": 492
766
  }
@@ -770,7 +770,7 @@
770
  "num_input_tokens_seen": 0,
771
  "num_train_epochs": 16,
772
  "save_steps": 500,
773
- "total_flos": 1720131088788000.0,
774
  "train_batch_size": 8,
775
  "trial_name": null,
776
  "trial_params": null
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 271.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 139.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.778263585259213,
27
+ "precision": 0.643595041322314,
28
+ "recall": 0.9842022116903634,
29
+ "support": 633.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.5213290460878884,
33
+ "precision": 0.4563708012760368,
34
+ "recall": 0.6078480379905024,
35
+ "support": 4001.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.520462355513902,
39
+ "precision": 0.7011784511784511,
40
+ "recall": 0.4138102334823646,
41
+ "support": 2013.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8648793805666204,
45
+ "precision": 0.8778050331607159,
46
+ "recall": 0.8523288637967537,
47
+ "support": 11336.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.9947169811320755,
51
+ "precision": 0.9991081780076697,
52
+ "recall": 0.9903642149929278,
53
+ "support": 11312.0
54
  },
55
+ "eval_accuracy": 0.8332940582393537,
56
+ "eval_loss": 0.4083092212677002,
57
  "eval_macro avg": {
58
+ "f1-score": 0.5256644783656713,
59
+ "precision": 0.5254367864207411,
60
+ "recall": 0.5497933659932731,
61
+ "support": 29705.0
62
+ },
63
+ "eval_runtime": 1.4074,
64
+ "eval_samples_per_second": 56.843,
65
+ "eval_steps_per_second": 7.105,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.830926787853407,
68
+ "precision": 0.8381591322948091,
69
+ "recall": 0.8332940582393537,
70
+ "support": 29705.0
71
  },
72
  "step": 41
73
  },
74
  {
75
  "epoch": 2.0,
76
  "eval_B-Claim": {
77
+ "f1-score": 0.29931972789115646,
78
+ "precision": 0.38823529411764707,
79
+ "recall": 0.24354243542435425,
80
+ "support": 271.0
81
  },
82
  "eval_B-MajorClaim": {
83
+ "f1-score": 0.2976190476190476,
84
+ "precision": 0.8620689655172413,
85
+ "recall": 0.17985611510791366,
86
+ "support": 139.0
87
  },
88
  "eval_B-Premise": {
89
+ "f1-score": 0.8474576271186441,
90
+ "precision": 0.7422802850356295,
91
+ "recall": 0.9873617693522907,
92
+ "support": 633.0
93
  },
94
  "eval_I-Claim": {
95
+ "f1-score": 0.42762951334379906,
96
+ "precision": 0.5749261291684254,
97
+ "recall": 0.340414896275931,
98
+ "support": 4001.0
99
  },
100
  "eval_I-MajorClaim": {
101
+ "f1-score": 0.7763546798029557,
102
+ "precision": 0.7699071812408402,
103
+ "recall": 0.7829110779930452,
104
+ "support": 2013.0
105
  },
106
  "eval_I-Premise": {
107
+ "f1-score": 0.8837899073120494,
108
+ "precision": 0.8290439755777108,
109
+ "recall": 0.9462773465067043,
110
+ "support": 11336.0
111
  },
112
  "eval_O": {
113
+ "f1-score": 0.9997789664471067,
114
+ "precision": 0.9999115748518879,
115
+ "recall": 0.9996463932107497,
116
+ "support": 11312.0
117
  },
118
+ "eval_accuracy": 0.8648039050664871,
119
+ "eval_loss": 0.29589229822158813,
120
  "eval_macro avg": {
121
+ "f1-score": 0.6474213527906798,
122
+ "precision": 0.7380533436441974,
123
+ "recall": 0.6400014334101413,
124
+ "support": 29705.0
125
+ },
126
+ "eval_runtime": 1.4156,
127
+ "eval_samples_per_second": 56.514,
128
+ "eval_steps_per_second": 7.064,
129
  "eval_weighted avg": {
130
+ "f1-score": 0.8503893311871605,
131
+ "precision": 0.850161508562683,
132
+ "recall": 0.8648039050664871,
133
+ "support": 29705.0
134
  },
135
  "step": 82
136
  },
137
  {
138
  "epoch": 3.0,
139
  "eval_B-Claim": {
140
+ "f1-score": 0.5958254269449716,
141
+ "precision": 0.61328125,
142
+ "recall": 0.5793357933579336,
143
+ "support": 271.0
144
  },
145
  "eval_B-MajorClaim": {
146
+ "f1-score": 0.7816901408450705,
147
+ "precision": 0.7655172413793103,
148
+ "recall": 0.7985611510791367,
149
+ "support": 139.0
150
  },
151
  "eval_B-Premise": {
152
+ "f1-score": 0.88,
153
+ "precision": 0.8738317757009346,
154
+ "recall": 0.8862559241706162,
155
+ "support": 633.0
156
  },
157
  "eval_I-Claim": {
158
+ "f1-score": 0.6080141575022121,
159
+ "precision": 0.6150895140664961,
160
+ "recall": 0.6010997250687328,
161
+ "support": 4001.0
162
  },
163
  "eval_I-MajorClaim": {
164
+ "f1-score": 0.8229895104895104,
165
+ "precision": 0.7346859149434257,
166
+ "recall": 0.9354197714853453,
167
+ "support": 2013.0
168
  },
169
  "eval_I-Premise": {
170
+ "f1-score": 0.8927189271892718,
171
+ "precision": 0.9111703104905383,
172
+ "recall": 0.875,
173
+ "support": 11336.0
174
  },
175
  "eval_O": {
176
+ "f1-score": 0.9996020340481981,
177
+ "precision": 1.0,
178
+ "recall": 0.9992043847241867,
179
+ "support": 11312.0
180
  },
181
+ "eval_accuracy": 0.8866857431408853,
182
+ "eval_loss": 0.2633354663848877,
183
  "eval_macro avg": {
184
+ "f1-score": 0.7972628852884621,
185
+ "precision": 0.7876537152258151,
186
+ "recall": 0.8106966785551358,
187
+ "support": 29705.0
188
+ },
189
+ "eval_runtime": 1.4195,
190
+ "eval_samples_per_second": 56.358,
191
+ "eval_steps_per_second": 7.045,
192
  "eval_weighted avg": {
193
+ "f1-score": 0.8868495578802252,
194
+ "precision": 0.8889636142603039,
195
+ "recall": 0.8866857431408853,
196
+ "support": 29705.0
197
  },
198
  "step": 123
199
  },
200
  {
201
  "epoch": 4.0,
202
  "eval_B-Claim": {
203
+ "f1-score": 0.6368515205724509,
204
+ "precision": 0.6180555555555556,
205
+ "recall": 0.6568265682656826,
206
+ "support": 271.0
207
  },
208
  "eval_B-MajorClaim": {
209
+ "f1-score": 0.8129032258064516,
210
+ "precision": 0.7368421052631579,
211
+ "recall": 0.9064748201438849,
212
+ "support": 139.0
213
  },
214
  "eval_B-Premise": {
215
+ "f1-score": 0.8759244042728019,
216
+ "precision": 0.9126712328767124,
217
+ "recall": 0.8420221169036335,
218
+ "support": 633.0
219
  },
220
  "eval_I-Claim": {
221
+ "f1-score": 0.6030037546933668,
222
+ "precision": 0.6039107545750815,
223
+ "recall": 0.6020994751312172,
224
+ "support": 4001.0
225
  },
226
  "eval_I-MajorClaim": {
227
+ "f1-score": 0.8346312414109024,
228
+ "precision": 0.7743306417339566,
229
+ "recall": 0.905116741182315,
230
+ "support": 2013.0
231
  },
232
  "eval_I-Premise": {
233
+ "f1-score": 0.8875363616021481,
234
+ "precision": 0.9007175946952494,
235
+ "recall": 0.8747353563867325,
236
+ "support": 11336.0
237
  },
238
  "eval_O": {
239
+ "f1-score": 0.9999557971975424,
240
+ "precision": 1.0,
241
+ "recall": 0.9999115983026874,
242
+ "support": 11312.0
243
  },
244
+ "eval_accuracy": 0.8852045110250799,
245
+ "eval_loss": 0.27674925327301025,
246
  "eval_macro avg": {
247
+ "f1-score": 0.8072580436508092,
248
+ "precision": 0.7923611263856734,
249
+ "recall": 0.8267409537594504,
250
+ "support": 29705.0
251
+ },
252
+ "eval_runtime": 1.4101,
253
+ "eval_samples_per_second": 56.735,
254
+ "eval_steps_per_second": 7.092,
255
  "eval_weighted avg": {
256
+ "f1-score": 0.8855540596827394,
257
+ "precision": 0.8868925824921324,
258
+ "recall": 0.8852045110250799,
259
+ "support": 29705.0
260
  },
261
  "step": 164
262
  },
263
  {
264
  "epoch": 5.0,
265
  "eval_B-Claim": {
266
+ "f1-score": 0.6735042735042734,
267
+ "precision": 0.6273885350318471,
268
+ "recall": 0.7269372693726938,
269
+ "support": 271.0
270
  },
271
  "eval_B-MajorClaim": {
272
+ "f1-score": 0.8514851485148515,
273
+ "precision": 0.7865853658536586,
274
+ "recall": 0.9280575539568345,
275
+ "support": 139.0
276
  },
277
  "eval_B-Premise": {
278
+ "f1-score": 0.8740617180984154,
279
+ "precision": 0.9257950530035336,
280
+ "recall": 0.8278041074249605,
281
+ "support": 633.0
282
  },
283
  "eval_I-Claim": {
284
+ "f1-score": 0.6534240561896401,
285
+ "precision": 0.5824691841126981,
286
+ "recall": 0.744063984003999,
287
+ "support": 4001.0
288
  },
289
  "eval_I-MajorClaim": {
290
+ "f1-score": 0.8683019766611098,
291
+ "precision": 0.8339432753888381,
292
+ "recall": 0.9056135121708893,
293
+ "support": 2013.0
294
  },
295
  "eval_I-Premise": {
296
+ "f1-score": 0.8769748527624568,
297
+ "precision": 0.9326903957049115,
298
+ "recall": 0.8275405786873676,
299
+ "support": 11336.0
300
  },
301
  "eval_O": {
302
+ "f1-score": 0.9997347245556637,
303
+ "precision": 1.0,
304
+ "recall": 0.9994695898161244,
305
+ "support": 11312.0
306
  },
307
+ "eval_accuracy": 0.8866184144083488,
308
+ "eval_loss": 0.2875027358531952,
309
  "eval_macro avg": {
310
+ "f1-score": 0.8282123928980587,
311
+ "precision": 0.8126959727279266,
312
+ "recall": 0.8513552279189812,
313
+ "support": 29705.0
314
+ },
315
+ "eval_runtime": 1.4103,
316
+ "eval_samples_per_second": 56.726,
317
+ "eval_steps_per_second": 7.091,
318
  "eval_weighted avg": {
319
+ "f1-score": 0.8909875382676978,
320
+ "precision": 0.90084333519953,
321
+ "recall": 0.8866184144083488,
322
+ "support": 29705.0
323
  },
324
  "step": 205
325
  },
326
  {
327
  "epoch": 6.0,
328
  "eval_B-Claim": {
329
+ "f1-score": 0.6584070796460177,
330
+ "precision": 0.6326530612244898,
331
+ "recall": 0.6863468634686347,
332
+ "support": 271.0
333
  },
334
  "eval_B-MajorClaim": {
335
+ "f1-score": 0.8421052631578947,
336
+ "precision": 0.8818897637795275,
337
+ "recall": 0.8057553956834532,
338
+ "support": 139.0
339
  },
340
  "eval_B-Premise": {
341
+ "f1-score": 0.8780876494023905,
342
+ "precision": 0.8858520900321544,
343
+ "recall": 0.8704581358609794,
344
+ "support": 633.0
345
  },
346
  "eval_I-Claim": {
347
+ "f1-score": 0.6172492982903802,
348
+ "precision": 0.6304404482668752,
349
+ "recall": 0.6045988502874281,
350
+ "support": 4001.0
351
  },
352
  "eval_I-MajorClaim": {
353
+ "f1-score": 0.8752545824847251,
354
+ "precision": 0.8976501305483029,
355
+ "recall": 0.8539493293591655,
356
+ "support": 2013.0
357
  },
358
  "eval_I-Premise": {
359
+ "f1-score": 0.8908354033206956,
360
+ "precision": 0.8802859357505813,
361
+ "recall": 0.9016407904022583,
362
+ "support": 11336.0
363
  },
364
  "eval_O": {
365
+ "f1-score": 0.9994250585997965,
366
+ "precision": 1.0,
367
+ "recall": 0.9988507779349364,
368
+ "support": 11312.0
369
  },
370
+ "eval_accuracy": 0.8923413566739606,
371
+ "eval_loss": 0.2945018410682678,
372
  "eval_macro avg": {
373
+ "f1-score": 0.8230520478431285,
374
+ "precision": 0.829824489943133,
375
+ "recall": 0.8173714489995507,
376
+ "support": 29705.0
377
+ },
378
+ "eval_runtime": 1.4167,
379
+ "eval_samples_per_second": 56.47,
380
+ "eval_steps_per_second": 7.059,
381
  "eval_weighted avg": {
382
+ "f1-score": 0.8916619674856285,
383
+ "precision": 0.8912660947222903,
384
+ "recall": 0.8923413566739606,
385
+ "support": 29705.0
386
  },
387
  "step": 246
388
  },
389
  {
390
  "epoch": 7.0,
391
  "eval_B-Claim": {
392
+ "f1-score": 0.6748681898066783,
393
+ "precision": 0.6442953020134228,
394
+ "recall": 0.7084870848708487,
395
+ "support": 271.0
396
  },
397
  "eval_B-MajorClaim": {
398
+ "f1-score": 0.8705035971223022,
399
+ "precision": 0.8705035971223022,
400
+ "recall": 0.8705035971223022,
401
+ "support": 139.0
402
  },
403
  "eval_B-Premise": {
404
+ "f1-score": 0.8788368336025849,
405
+ "precision": 0.8991735537190083,
406
+ "recall": 0.8593996840442338,
407
+ "support": 633.0
408
  },
409
  "eval_I-Claim": {
410
+ "f1-score": 0.6305652826413206,
411
+ "precision": 0.6310387984981226,
412
+ "recall": 0.6300924768807799,
413
+ "support": 4001.0
414
  },
415
  "eval_I-MajorClaim": {
416
+ "f1-score": 0.8747152619589977,
417
+ "precision": 0.891640866873065,
418
+ "recall": 0.8584202682563339,
419
+ "support": 2013.0
420
  },
421
  "eval_I-Premise": {
422
+ "f1-score": 0.8918871407225103,
423
+ "precision": 0.8886845331932037,
424
+ "recall": 0.8951129146083274,
425
+ "support": 11336.0
426
  },
427
  "eval_O": {
428
+ "f1-score": 1.0,
429
+ "precision": 1.0,
430
+ "recall": 1.0,
431
+ "support": 11312.0
432
  },
433
+ "eval_accuracy": 0.8942938899175223,
434
+ "eval_loss": 0.30371928215026855,
435
  "eval_macro avg": {
436
+ "f1-score": 0.8316251865506278,
437
+ "precision": 0.832190950202732,
438
+ "recall": 0.8317165751118323,
439
+ "support": 29705.0
440
+ },
441
+ "eval_runtime": 1.4098,
442
+ "eval_samples_per_second": 56.745,
443
+ "eval_steps_per_second": 7.093,
444
  "eval_weighted avg": {
445
+ "f1-score": 0.894338297946804,
446
+ "precision": 0.8944813348740749,
447
+ "recall": 0.8942938899175223,
448
+ "support": 29705.0
449
  },
450
  "step": 287
451
  },
452
  {
453
  "epoch": 8.0,
454
  "eval_B-Claim": {
455
+ "f1-score": 0.6325757575757576,
456
+ "precision": 0.6498054474708171,
457
+ "recall": 0.6162361623616236,
458
+ "support": 271.0
459
  },
460
  "eval_B-MajorClaim": {
461
+ "f1-score": 0.8602941176470588,
462
+ "precision": 0.8796992481203008,
463
+ "recall": 0.841726618705036,
464
+ "support": 139.0
465
  },
466
  "eval_B-Premise": {
467
+ "f1-score": 0.8780108780108781,
468
+ "precision": 0.863914373088685,
469
+ "recall": 0.8925750394944708,
470
+ "support": 633.0
471
  },
472
  "eval_I-Claim": {
473
+ "f1-score": 0.5998663994655979,
474
+ "precision": 0.644374282433984,
475
+ "recall": 0.5611097225693576,
476
+ "support": 4001.0
477
  },
478
  "eval_I-MajorClaim": {
479
+ "f1-score": 0.8755122950819673,
480
+ "precision": 0.9037546271813856,
481
+ "recall": 0.8489816194734228,
482
+ "support": 2013.0
483
  },
484
  "eval_I-Premise": {
485
+ "f1-score": 0.8923684097636309,
486
+ "precision": 0.8685594989561587,
487
+ "recall": 0.9175194071983063,
488
+ "support": 11336.0
489
  },
490
  "eval_O": {
491
+ "f1-score": 0.9999557971975424,
492
+ "precision": 1.0,
493
+ "recall": 0.9999115983026874,
494
+ "support": 11312.0
495
  },
496
+ "eval_accuracy": 0.892610671604107,
497
+ "eval_loss": 0.3549477458000183,
498
  "eval_macro avg": {
499
+ "f1-score": 0.8197976649632047,
500
+ "precision": 0.8300153538930474,
501
+ "recall": 0.811151452586415,
502
+ "support": 29705.0
503
+ },
504
+ "eval_runtime": 1.4225,
505
+ "eval_samples_per_second": 56.239,
506
+ "eval_steps_per_second": 7.03,
507
  "eval_weighted avg": {
508
+ "f1-score": 0.8899730612246367,
509
+ "precision": 0.8887602531095763,
510
+ "recall": 0.892610671604107,
511
+ "support": 29705.0
512
  },
513
  "step": 328
514
  },
515
  {
516
  "epoch": 9.0,
517
  "eval_B-Claim": {
518
+ "f1-score": 0.6642728904847396,
519
+ "precision": 0.6468531468531469,
520
+ "recall": 0.6826568265682657,
521
+ "support": 271.0
522
  },
523
  "eval_B-MajorClaim": {
524
+ "f1-score": 0.8480565371024734,
525
+ "precision": 0.8333333333333334,
526
+ "recall": 0.8633093525179856,
527
+ "support": 139.0
528
  },
529
  "eval_B-Premise": {
530
+ "f1-score": 0.8805132317562149,
531
+ "precision": 0.8941368078175895,
532
+ "recall": 0.8672985781990521,
533
+ "support": 633.0
534
  },
535
  "eval_I-Claim": {
536
+ "f1-score": 0.637490882567469,
537
+ "precision": 0.6205917159763313,
538
+ "recall": 0.6553361659585104,
539
+ "support": 4001.0
540
  },
541
  "eval_I-MajorClaim": {
542
+ "f1-score": 0.8618255168935955,
543
+ "precision": 0.8750640040962622,
544
+ "recall": 0.8489816194734228,
545
+ "support": 2013.0
546
  },
547
  "eval_I-Premise": {
548
+ "f1-score": 0.8898067954696869,
549
+ "precision": 0.8960551033187226,
550
+ "recall": 0.8836450247000706,
551
+ "support": 11336.0
552
  },
553
  "eval_O": {
554
+ "f1-score": 0.9996462681287585,
555
+ "precision": 1.0,
556
+ "recall": 0.9992927864214993,
557
+ "support": 11312.0
558
  },
559
+ "eval_accuracy": 0.8923076923076924,
560
+ "eval_loss": 0.3715985417366028,
561
  "eval_macro avg": {
562
+ "f1-score": 0.8259445889147053,
563
+ "precision": 0.8237191587707694,
564
+ "recall": 0.8286457648341152,
565
+ "support": 29705.0
566
+ },
567
+ "eval_runtime": 1.4176,
568
+ "eval_samples_per_second": 56.435,
569
+ "eval_steps_per_second": 7.054,
570
  "eval_weighted avg": {
571
+ "f1-score": 0.8933030430182268,
572
+ "precision": 0.8945056752252882,
573
+ "recall": 0.8923076923076924,
574
+ "support": 29705.0
575
  },
576
  "step": 369
577
  },
578
  {
579
  "epoch": 10.0,
580
  "eval_B-Claim": {
581
+ "f1-score": 0.6461538461538461,
582
+ "precision": 0.6746987951807228,
583
+ "recall": 0.6199261992619927,
584
+ "support": 271.0
585
  },
586
  "eval_B-MajorClaim": {
587
+ "f1-score": 0.852233676975945,
588
+ "precision": 0.8157894736842105,
589
+ "recall": 0.8920863309352518,
590
+ "support": 139.0
591
  },
592
  "eval_B-Premise": {
593
+ "f1-score": 0.8847058823529412,
594
+ "precision": 0.8785046728971962,
595
+ "recall": 0.8909952606635071,
596
+ "support": 633.0
597
  },
598
  "eval_I-Claim": {
599
+ "f1-score": 0.6189843126827972,
600
+ "precision": 0.6611758023288838,
601
+ "recall": 0.5818545363659086,
602
+ "support": 4001.0
603
  },
604
  "eval_I-MajorClaim": {
605
+ "f1-score": 0.8606089438629877,
606
+ "precision": 0.8256503879507074,
607
+ "recall": 0.8986587183308494,
608
+ "support": 2013.0
609
  },
610
  "eval_I-Premise": {
611
+ "f1-score": 0.8974191582887234,
612
+ "precision": 0.8856627437505369,
613
+ "recall": 0.9094918842625265,
614
+ "support": 11336.0
615
  },
616
  "eval_O": {
617
+ "f1-score": 0.9998673798682641,
618
+ "precision": 1.0,
619
+ "recall": 0.9997347949080623,
620
+ "support": 11312.0
621
  },
622
+ "eval_accuracy": 0.8958761151321326,
623
+ "eval_loss": 0.4143347144126892,
624
  "eval_macro avg": {
625
+ "f1-score": 0.822853314312215,
626
+ "precision": 0.8202116965417511,
627
+ "recall": 0.8275353892468712,
628
+ "support": 29705.0
629
+ },
630
+ "eval_runtime": 1.4266,
631
+ "eval_samples_per_second": 56.076,
632
+ "eval_steps_per_second": 7.01,
633
  "eval_weighted avg": {
634
+ "f1-score": 0.8936607445011815,
635
+ "precision": 0.8924963153509083,
636
+ "recall": 0.8958761151321326,
637
+ "support": 29705.0
638
  },
639
  "step": 410
640
  },
641
  {
642
  "epoch": 11.0,
643
  "eval_B-Claim": {
644
+ "f1-score": 0.6748681898066783,
645
+ "precision": 0.6442953020134228,
646
+ "recall": 0.7084870848708487,
647
+ "support": 271.0
648
  },
649
  "eval_B-MajorClaim": {
650
+ "f1-score": 0.8754448398576513,
651
+ "precision": 0.8661971830985915,
652
+ "recall": 0.8848920863309353,
653
+ "support": 139.0
654
  },
655
  "eval_B-Premise": {
656
+ "f1-score": 0.8770226537216829,
657
+ "precision": 0.8988391376451078,
658
+ "recall": 0.8562401263823065,
659
+ "support": 633.0
660
  },
661
  "eval_I-Claim": {
662
+ "f1-score": 0.6444880923152466,
663
+ "precision": 0.6332931242460796,
664
+ "recall": 0.6560859785053736,
665
+ "support": 4001.0
666
  },
667
  "eval_I-MajorClaim": {
668
+ "f1-score": 0.8760289348964829,
669
+ "precision": 0.8797595190380761,
670
+ "recall": 0.8723298559364133,
671
+ "support": 2013.0
672
  },
673
  "eval_I-Premise": {
674
+ "f1-score": 0.8931358637814828,
675
+ "precision": 0.8979136947218259,
676
+ "recall": 0.8884086097388849,
677
+ "support": 11336.0
678
  },
679
  "eval_O": {
680
+ "f1-score": 0.9996904982977407,
681
+ "precision": 1.0,
682
+ "recall": 0.9993811881188119,
683
+ "support": 11312.0
684
  },
685
+ "eval_accuracy": 0.8959434438646693,
686
+ "eval_loss": 0.4241807460784912,
687
  "eval_macro avg": {
688
+ "f1-score": 0.8343827246681379,
689
+ "precision": 0.8314711372518719,
690
+ "recall": 0.8379749899833678,
691
+ "support": 29705.0
692
+ },
693
+ "eval_runtime": 1.4169,
694
+ "eval_samples_per_second": 56.462,
695
+ "eval_steps_per_second": 7.058,
696
  "eval_weighted avg": {
697
+ "f1-score": 0.8966457372110589,
698
+ "precision": 0.8974745650471141,
699
+ "recall": 0.8959434438646693,
700
+ "support": 29705.0
701
  },
702
  "step": 451
703
  },
704
  {
705
  "epoch": 12.0,
706
  "eval_B-Claim": {
707
+ "f1-score": 0.6175869120654396,
708
+ "precision": 0.6926605504587156,
709
+ "recall": 0.5571955719557196,
710
+ "support": 271.0
711
  },
712
  "eval_B-MajorClaim": {
713
+ "f1-score": 0.8695652173913043,
714
+ "precision": 0.8759124087591241,
715
+ "recall": 0.8633093525179856,
716
+ "support": 139.0
717
  },
718
  "eval_B-Premise": {
719
+ "f1-score": 0.8819969742813918,
720
+ "precision": 0.8461538461538461,
721
+ "recall": 0.9210110584518167,
722
+ "support": 633.0
723
  },
724
  "eval_I-Claim": {
725
+ "f1-score": 0.5798017526217497,
726
+ "precision": 0.6817567567567567,
727
+ "recall": 0.5043739065233691,
728
+ "support": 4001.0
729
  },
730
  "eval_I-MajorClaim": {
731
+ "f1-score": 0.8793675082887019,
732
+ "precision": 0.9035639412997903,
733
+ "recall": 0.8564331843020367,
734
+ "support": 2013.0
735
  },
736
  "eval_I-Premise": {
737
+ "f1-score": 0.8959295006294586,
738
+ "precision": 0.8544101168560909,
739
+ "recall": 0.9416901905434015,
740
+ "support": 11336.0
741
  },
742
  "eval_O": {
743
+ "f1-score": 0.9994250585997965,
744
+ "precision": 1.0,
745
+ "recall": 0.9988507779349364,
746
+ "support": 11312.0
747
  },
748
+ "eval_accuracy": 0.8944622117488639,
749
+ "eval_loss": 0.49107131361961365,
750
  "eval_macro avg": {
751
+ "f1-score": 0.8176675605539775,
752
+ "precision": 0.8363510886120462,
753
+ "recall": 0.8061234346041807,
754
+ "support": 29705.0
755
+ },
756
+ "eval_runtime": 1.4189,
757
+ "eval_samples_per_second": 56.383,
758
+ "eval_steps_per_second": 7.048,
759
  "eval_weighted avg": {
760
+ "f1-score": 0.8886802353660483,
761
+ "precision": 0.888377522333214,
762
+ "recall": 0.8944622117488639,
763
+ "support": 29705.0
764
  },
765
  "step": 492
766
  }
 
770
  "num_input_tokens_seen": 0,
771
  "num_train_epochs": 16,
772
  "save_steps": 500,
773
+ "total_flos": 1725489752616000.0,
774
  "train_batch_size": 8,
775
  "trial_name": null,
776
  "trial_params": null
checkpoint-492/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3e60aef760c0bebacd32c85d34779d7bd28b7fb5a467a761ffe5e8a7e5bb2bb
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e06f6b44c30fa94c6272333e445e6562930fffeb3ba856f3a9330b45193b951f
3
  size 4728