nlpso committed on
Commit
cab6869
·
1 Parent(s): 44937ca

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "HueyNemud/das22-10-camembert_pretrained",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-PER+O",
17
+ "2": "I-PER+i_TITREH",
18
+ "3": "I-ACT+O",
19
+ "4": "I-DESC+O",
20
+ "5": "I-DESC+i_ACT",
21
+ "6": "I-DESC+i_TITREP",
22
+ "7": "I-SPAT+O",
23
+ "8": "I-SPAT+i_LOC",
24
+ "9": "I-SPAT+i_CARDINAL",
25
+ "10": "I-SPAT+i_FT",
26
+ "11": "I-TITRE+O"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "label2id": {
31
+ "I-ACT+O": 3,
32
+ "I-DESC+O": 4,
33
+ "I-DESC+i_ACT": 5,
34
+ "I-DESC+i_TITREP": 6,
35
+ "I-PER+O": 1,
36
+ "I-PER+i_TITREH": 2,
37
+ "I-SPAT+O": 7,
38
+ "I-SPAT+i_CARDINAL": 9,
39
+ "I-SPAT+i_FT": 10,
40
+ "I-SPAT+i_LOC": 8,
41
+ "I-TITRE+O": 11,
42
+ "O+O": 0
43
+ },
44
+ "layer_norm_eps": 1e-05,
45
+ "max_position_embeddings": 514,
46
+ "model_type": "camembert",
47
+ "num_attention_heads": 12,
48
+ "num_hidden_layers": 12,
49
+ "output_past": true,
50
+ "pad_token_id": 1,
51
+ "position_embedding_type": "absolute",
52
+ "torch_dtype": "float32",
53
+ "transformers_version": "4.25.1",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 32005
57
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:108ceefd1b23089d94252bdb7f0c9e62753dad634c7db074c18d13b5d43234cf
3
+ size 880440037
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a1e09bbad0436728b8cbb17445070c91de69aa77b121da59d30ee88ca589667
3
+ size 440233393
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:525248a12ab5a80da311ba4bae6b44d175fe28c236b0a5d1a41fb9b5be2722b0
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec6331a2d4f82e15c898be3d09fa0a39ccbc9d6fd132b0505ce16e06776b6d8e
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "HueyNemud/das22-10-camembert_pretrained",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/jchazalo/.cache/huggingface/transformers/fe0e213c44079a9ee091098f81fff2941484006e9ba3001a9bf1ee9f87537599.cb3ec3a6c1200d181228d8825ae9767572abca54efa1bbb37fd83d721b2ef323",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,1028 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9649173673528558,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/323-pretrained-camembert-ner-hierarchical-loss-io/checkpoint-1000",
4
+ "epoch": 2.6246719160104988,
5
+ "global_step": 1000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.9041353383458647,
14
+ "number": 519,
15
+ "precision": 0.8825688073394495,
16
+ "recall": 0.9267822736030829
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.9179389312977099,
20
+ "number": 503,
21
+ "precision": 0.8825688073394495,
22
+ "recall": 0.9562624254473161
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9730123997082422,
32
+ "number": 678,
33
+ "precision": 0.9624819624819625,
34
+ "recall": 0.9837758112094396
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9365598430346632,
50
+ "number": 761,
51
+ "precision": 0.9322916666666666,
52
+ "recall": 0.9408672798948752
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.931667891256429,
56
+ "number": 676,
57
+ "precision": 0.9255474452554745,
58
+ "recall": 0.9378698224852071
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.9334287759484609,
62
+ "number": 694,
63
+ "precision": 0.9274537695590327,
64
+ "recall": 0.9394812680115274
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.9357124778537079,
85
+ "eval_accuracy-all": 0.9560870665654265,
86
+ "eval_accuracy-das": 0.94874715261959,
87
+ "eval_accuracy-l1": 0.9444444444444444,
88
+ "eval_accuracy-l2": 0.9677296886864085,
89
+ "eval_f1": 0.9315068493150684,
90
+ "eval_f1-all": 0.9264705882352942,
91
+ "eval_f1-das": 0.9278273809523809,
92
+ "eval_f1-l1": 0.9207920792079207,
93
+ "eval_f1-l2": 0.9338284942606346,
94
+ "eval_loss": 0.3864385783672333,
95
+ "eval_precision": 0.9339567504383401,
96
+ "eval_precision-all": 0.9281084266352386,
97
+ "eval_precision-das": 0.9267930137495355,
98
+ "eval_precision-l1": 0.9141231246766683,
99
+ "eval_precision-l2": 0.946611909650924,
100
+ "eval_recall": 0.9290697674418604,
101
+ "eval_recall-all": 0.9248385202583675,
102
+ "eval_recall-das": 0.9288640595903166,
103
+ "eval_recall-l1": 0.9275590551181102,
104
+ "eval_recall-l2": 0.9213857428381079,
105
+ "eval_runtime": 5.8217,
106
+ "eval_samples_per_second": 116.117,
107
+ "eval_steps_per_second": 7.386,
108
+ "step": 100
109
+ },
110
+ {
111
+ "epoch": 0.52,
112
+ "eval_ACT": {
113
+ "f1": 0.9251184834123224,
114
+ "number": 519,
115
+ "precision": 0.9104477611940298,
116
+ "recall": 0.9402697495183044
117
+ },
118
+ "eval_ACT_L1": {
119
+ "f1": 0.9393647738209817,
120
+ "number": 503,
121
+ "precision": 0.9104477611940298,
122
+ "recall": 0.9701789264413518
123
+ },
124
+ "eval_ACT_L2": {
125
+ "f1": 0.0,
126
+ "number": 16,
127
+ "precision": 0.0,
128
+ "recall": 0.0
129
+ },
130
+ "eval_CARDINAL": {
131
+ "f1": 0.9874723655121592,
132
+ "number": 678,
133
+ "precision": 0.9867452135493373,
134
+ "recall": 0.9882005899705014
135
+ },
136
+ "eval_DESC": {
137
+ "f1": 0.2153846153846154,
138
+ "number": 30,
139
+ "precision": 0.2,
140
+ "recall": 0.23333333333333334
141
+ },
142
+ "eval_FT": {
143
+ "f1": 0.0,
144
+ "number": 7,
145
+ "precision": 0.0,
146
+ "recall": 0.0
147
+ },
148
+ "eval_LOC": {
149
+ "f1": 0.9395711500974658,
150
+ "number": 761,
151
+ "precision": 0.929305912596401,
152
+ "recall": 0.9500657030223391
153
+ },
154
+ "eval_PER": {
155
+ "f1": 0.9690721649484536,
156
+ "number": 676,
157
+ "precision": 0.9648093841642229,
158
+ "recall": 0.9733727810650887
159
+ },
160
+ "eval_SPAT": {
161
+ "f1": 0.9549033643521831,
162
+ "number": 694,
163
+ "precision": 0.9487908961593172,
164
+ "recall": 0.9610951008645533
165
+ },
166
+ "eval_TITRE": {
167
+ "f1": 0.0,
168
+ "number": 2,
169
+ "precision": 0.0,
170
+ "recall": 0.0
171
+ },
172
+ "eval_TITREH": {
173
+ "f1": 0.6666666666666666,
174
+ "number": 33,
175
+ "precision": 0.7,
176
+ "recall": 0.6363636363636364
177
+ },
178
+ "eval_TITREP": {
179
+ "f1": 0.0,
180
+ "number": 6,
181
+ "precision": 0.0,
182
+ "recall": 0.0
183
+ },
184
+ "eval_accuracy": 0.9536826119969628,
185
+ "eval_accuracy-all": 0.9668438370032904,
186
+ "eval_accuracy-das": 0.9674765882055176,
187
+ "eval_accuracy-l1": 0.960642875221463,
188
+ "eval_accuracy-l2": 0.9730447987851177,
189
+ "eval_f1": 0.947444621398581,
190
+ "eval_f1-all": 0.9443714410862899,
191
+ "eval_f1-das": 0.9526989426822481,
192
+ "eval_f1-l1": 0.9427609427609427,
193
+ "eval_f1-l2": 0.9464524765729585,
194
+ "eval_loss": 0.2513241171836853,
195
+ "eval_precision": 0.9437554081338333,
196
+ "eval_precision-all": 0.939297124600639,
197
+ "eval_precision-das": 0.9490022172949002,
198
+ "eval_precision-l1": 0.9304703476482618,
199
+ "eval_precision-l2": 0.9509078681909886,
200
+ "eval_recall": 0.9511627906976744,
201
+ "eval_recall-all": 0.9495008807985907,
202
+ "eval_recall-das": 0.9564245810055866,
203
+ "eval_recall-l1": 0.9553805774278216,
204
+ "eval_recall-l2": 0.9420386409060626,
205
+ "eval_runtime": 5.7364,
206
+ "eval_samples_per_second": 117.843,
207
+ "eval_steps_per_second": 7.496,
208
+ "step": 200
209
+ },
210
+ {
211
+ "epoch": 0.79,
212
+ "eval_ACT": {
213
+ "f1": 0.9367816091954023,
214
+ "number": 519,
215
+ "precision": 0.9314285714285714,
216
+ "recall": 0.9421965317919075
217
+ },
218
+ "eval_ACT_L1": {
219
+ "f1": 0.9513618677042801,
220
+ "number": 503,
221
+ "precision": 0.9314285714285714,
222
+ "recall": 0.9721669980119284
223
+ },
224
+ "eval_ACT_L2": {
225
+ "f1": 0.0,
226
+ "number": 16,
227
+ "precision": 0.0,
228
+ "recall": 0.0
229
+ },
230
+ "eval_CARDINAL": {
231
+ "f1": 0.9794419970631425,
232
+ "number": 678,
233
+ "precision": 0.9751461988304093,
234
+ "recall": 0.9837758112094396
235
+ },
236
+ "eval_DESC": {
237
+ "f1": 0.30985915492957744,
238
+ "number": 30,
239
+ "precision": 0.2682926829268293,
240
+ "recall": 0.36666666666666664
241
+ },
242
+ "eval_FT": {
243
+ "f1": 0.0,
244
+ "number": 7,
245
+ "precision": 0.0,
246
+ "recall": 0.0
247
+ },
248
+ "eval_LOC": {
249
+ "f1": 0.9495743287491814,
250
+ "number": 761,
251
+ "precision": 0.9464751958224543,
252
+ "recall": 0.9526938239159002
253
+ },
254
+ "eval_PER": {
255
+ "f1": 0.9697416974169741,
256
+ "number": 676,
257
+ "precision": 0.96759941089838,
258
+ "recall": 0.9718934911242604
259
+ },
260
+ "eval_SPAT": {
261
+ "f1": 0.9533381191672649,
262
+ "number": 694,
263
+ "precision": 0.949928469241774,
264
+ "recall": 0.9567723342939481
265
+ },
266
+ "eval_TITRE": {
267
+ "f1": 0.0,
268
+ "number": 2,
269
+ "precision": 0.0,
270
+ "recall": 0.0
271
+ },
272
+ "eval_TITREH": {
273
+ "f1": 0.71875,
274
+ "number": 33,
275
+ "precision": 0.7419354838709677,
276
+ "recall": 0.696969696969697
277
+ },
278
+ "eval_TITREP": {
279
+ "f1": 0.3636363636363636,
280
+ "number": 6,
281
+ "precision": 0.4,
282
+ "recall": 0.3333333333333333
283
+ },
284
+ "eval_accuracy": 0.9588711718552265,
285
+ "eval_accuracy-all": 0.9708301695773222,
286
+ "eval_accuracy-das": 0.9702606934953176,
287
+ "eval_accuracy-l1": 0.9658314350797267,
288
+ "eval_accuracy-l2": 0.9758289040749177,
289
+ "eval_f1": 0.9527125036263417,
290
+ "eval_f1-all": 0.9473376243417203,
291
+ "eval_f1-das": 0.9568612867236892,
292
+ "eval_f1-l1": 0.9462197973499611,
293
+ "eval_f1-l2": 0.9487780381653834,
294
+ "eval_loss": 0.19993722438812256,
295
+ "eval_precision": 0.950781702374059,
296
+ "eval_precision-all": 0.9440233236151604,
297
+ "eval_precision-das": 0.9554400297066469,
298
+ "eval_precision-l1": 0.9367283950617284,
299
+ "eval_precision-l2": 0.9535666218034994,
300
+ "eval_recall": 0.9546511627906977,
301
+ "eval_recall-all": 0.9506752789195537,
302
+ "eval_recall-das": 0.9582867783985103,
303
+ "eval_recall-l1": 0.9559055118110236,
304
+ "eval_recall-l2": 0.944037308461026,
305
+ "eval_runtime": 5.4991,
306
+ "eval_samples_per_second": 122.93,
307
+ "eval_steps_per_second": 7.819,
308
+ "step": 300
309
+ },
310
+ {
311
+ "epoch": 1.05,
312
+ "eval_ACT": {
313
+ "f1": 0.936372269705603,
314
+ "number": 519,
315
+ "precision": 0.9232209737827716,
316
+ "recall": 0.9499036608863198
317
+ },
318
+ "eval_ACT_L1": {
319
+ "f1": 0.9497098646034816,
320
+ "number": 503,
321
+ "precision": 0.9246704331450094,
322
+ "recall": 0.9761431411530815
323
+ },
324
+ "eval_ACT_L2": {
325
+ "f1": 0.21052631578947367,
326
+ "number": 16,
327
+ "precision": 0.6666666666666666,
328
+ "recall": 0.125
329
+ },
330
+ "eval_CARDINAL": {
331
+ "f1": 0.988962472406181,
332
+ "number": 678,
333
+ "precision": 0.986784140969163,
334
+ "recall": 0.9911504424778761
335
+ },
336
+ "eval_DESC": {
337
+ "f1": 0.29032258064516125,
338
+ "number": 30,
339
+ "precision": 0.28125,
340
+ "recall": 0.3
341
+ },
342
+ "eval_FT": {
343
+ "f1": 0.0,
344
+ "number": 7,
345
+ "precision": 0.0,
346
+ "recall": 0.0
347
+ },
348
+ "eval_LOC": {
349
+ "f1": 0.9593175853018372,
350
+ "number": 761,
351
+ "precision": 0.9580602883355177,
352
+ "recall": 0.9605781865965834
353
+ },
354
+ "eval_PER": {
355
+ "f1": 0.9705014749262537,
356
+ "number": 676,
357
+ "precision": 0.9676470588235294,
358
+ "recall": 0.9733727810650887
359
+ },
360
+ "eval_SPAT": {
361
+ "f1": 0.9548387096774194,
362
+ "number": 694,
363
+ "precision": 0.9500713266761769,
364
+ "recall": 0.9596541786743515
365
+ },
366
+ "eval_TITRE": {
367
+ "f1": 0.0,
368
+ "number": 2,
369
+ "precision": 0.0,
370
+ "recall": 0.0
371
+ },
372
+ "eval_TITREH": {
373
+ "f1": 0.8615384615384615,
374
+ "number": 33,
375
+ "precision": 0.875,
376
+ "recall": 0.8484848484848485
377
+ },
378
+ "eval_TITREP": {
379
+ "f1": 0.3333333333333333,
380
+ "number": 6,
381
+ "precision": 0.3333333333333333,
382
+ "recall": 0.3333333333333333
383
+ },
384
+ "eval_accuracy": 0.9596304732978993,
385
+ "eval_accuracy-all": 0.9715894710199949,
386
+ "eval_accuracy-das": 0.9746899519109087,
387
+ "eval_accuracy-l1": 0.9644393824348266,
388
+ "eval_accuracy-l2": 0.9787395596051632,
389
+ "eval_f1": 0.9591067285382832,
390
+ "eval_f1-all": 0.9536210680321872,
391
+ "eval_f1-das": 0.9631970260223048,
392
+ "eval_f1-l1": 0.9477786438035852,
393
+ "eval_f1-l2": 0.9611520428667114,
394
+ "eval_loss": 0.16297389566898346,
395
+ "eval_precision": 0.9568865740740741,
396
+ "eval_precision-all": 0.9504228638086906,
397
+ "eval_precision-das": 0.9614100185528757,
398
+ "eval_precision-l1": 0.9382716049382716,
399
+ "eval_precision-l2": 0.9663299663299664,
400
+ "eval_recall": 0.9613372093023256,
401
+ "eval_recall-all": 0.9568408690546095,
402
+ "eval_recall-das": 0.9649906890130354,
403
+ "eval_recall-l1": 0.9574803149606299,
404
+ "eval_recall-l2": 0.9560293137908061,
405
+ "eval_runtime": 5.7026,
406
+ "eval_samples_per_second": 118.543,
407
+ "eval_steps_per_second": 7.54,
408
+ "step": 400
409
+ },
410
+ {
411
+ "epoch": 1.31,
412
+ "learning_rate": 9e-05,
413
+ "loss": 0.3757,
414
+ "step": 500
415
+ },
416
+ {
417
+ "epoch": 1.31,
418
+ "eval_ACT": {
419
+ "f1": 0.9391634980988594,
420
+ "number": 519,
421
+ "precision": 0.926829268292683,
422
+ "recall": 0.9518304431599229
423
+ },
424
+ "eval_ACT_L1": {
425
+ "f1": 0.9620253164556961,
426
+ "number": 503,
427
+ "precision": 0.9427480916030534,
428
+ "recall": 0.9821073558648111
429
+ },
430
+ "eval_ACT_L2": {
431
+ "f1": 0.0,
432
+ "number": 16,
433
+ "precision": 0.0,
434
+ "recall": 0.0
435
+ },
436
+ "eval_CARDINAL": {
437
+ "f1": 0.9882005899705014,
438
+ "number": 678,
439
+ "precision": 0.9882005899705014,
440
+ "recall": 0.9882005899705014
441
+ },
442
+ "eval_DESC": {
443
+ "f1": 0.4210526315789474,
444
+ "number": 30,
445
+ "precision": 0.4444444444444444,
446
+ "recall": 0.4
447
+ },
448
+ "eval_FT": {
449
+ "f1": 0.0,
450
+ "number": 7,
451
+ "precision": 0.0,
452
+ "recall": 0.0
453
+ },
454
+ "eval_LOC": {
455
+ "f1": 0.9538061158100194,
456
+ "number": 761,
457
+ "precision": 0.9445876288659794,
458
+ "recall": 0.9632063074901446
459
+ },
460
+ "eval_PER": {
461
+ "f1": 0.9668386145910095,
462
+ "number": 676,
463
+ "precision": 0.9632892804698973,
464
+ "recall": 0.9704142011834319
465
+ },
466
+ "eval_SPAT": {
467
+ "f1": 0.9591397849462366,
468
+ "number": 694,
469
+ "precision": 0.9543509272467903,
470
+ "recall": 0.9639769452449568
471
+ },
472
+ "eval_TITRE": {
473
+ "f1": 0.0,
474
+ "number": 2,
475
+ "precision": 0.0,
476
+ "recall": 0.0
477
+ },
478
+ "eval_TITREH": {
479
+ "f1": 0.8253968253968254,
480
+ "number": 33,
481
+ "precision": 0.8666666666666667,
482
+ "recall": 0.7878787878787878
483
+ },
484
+ "eval_TITREP": {
485
+ "f1": 0.30769230769230765,
486
+ "number": 6,
487
+ "precision": 0.2857142857142857,
488
+ "recall": 0.3333333333333333
489
+ },
490
+ "eval_accuracy": 0.9562136168058719,
491
+ "eval_accuracy-all": 0.9681093394077449,
492
+ "eval_accuracy-das": 0.9724120475828905,
493
+ "eval_accuracy-l1": 0.9627942293090357,
494
+ "eval_accuracy-l2": 0.973424449506454,
495
+ "eval_f1": 0.9563205091119468,
496
+ "eval_f1-all": 0.9539406345957011,
497
+ "eval_f1-das": 0.9595847237671488,
498
+ "eval_f1-l1": 0.9541427826993225,
499
+ "eval_f1-l2": 0.9536821059646784,
500
+ "eval_loss": 0.16671402752399445,
501
+ "eval_precision": 0.9516407599309153,
502
+ "eval_precision-all": 0.9501893387707544,
503
+ "eval_precision-das": 0.9553340716131414,
504
+ "eval_precision-l1": 0.9472322814278323,
505
+ "eval_precision-l2": 0.954,
506
+ "eval_recall": 0.961046511627907,
507
+ "eval_recall-all": 0.9577216676453317,
508
+ "eval_recall-das": 0.9638733705772812,
509
+ "eval_recall-l1": 0.9611548556430446,
510
+ "eval_recall-l2": 0.9533644237175216,
511
+ "eval_runtime": 5.8183,
512
+ "eval_samples_per_second": 116.184,
513
+ "eval_steps_per_second": 7.39,
514
+ "step": 500
515
+ },
516
+ {
517
+ "epoch": 1.57,
518
+ "eval_ACT": {
519
+ "f1": 0.9446564885496184,
520
+ "number": 519,
521
+ "precision": 0.9357277882797732,
522
+ "recall": 0.953757225433526
523
+ },
524
+ "eval_ACT_L1": {
525
+ "f1": 0.962962962962963,
526
+ "number": 503,
527
+ "precision": 0.9445506692160612,
528
+ "recall": 0.9821073558648111
529
+ },
530
+ "eval_ACT_L2": {
531
+ "f1": 0.09090909090909091,
532
+ "number": 16,
533
+ "precision": 0.16666666666666666,
534
+ "recall": 0.0625
535
+ },
536
+ "eval_CARDINAL": {
537
+ "f1": 0.9845474613686535,
538
+ "number": 678,
539
+ "precision": 0.9823788546255506,
540
+ "recall": 0.9867256637168141
541
+ },
542
+ "eval_DESC": {
543
+ "f1": 0.4126984126984127,
544
+ "number": 30,
545
+ "precision": 0.3939393939393939,
546
+ "recall": 0.43333333333333335
547
+ },
548
+ "eval_FT": {
549
+ "f1": 0.2,
550
+ "number": 7,
551
+ "precision": 0.3333333333333333,
552
+ "recall": 0.14285714285714285
553
+ },
554
+ "eval_LOC": {
555
+ "f1": 0.9621409921671019,
556
+ "number": 761,
557
+ "precision": 0.9559014267185474,
558
+ "recall": 0.9684625492772667
559
+ },
560
+ "eval_PER": {
561
+ "f1": 0.9556213017751479,
562
+ "number": 676,
563
+ "precision": 0.9556213017751479,
564
+ "recall": 0.9556213017751479
565
+ },
566
+ "eval_SPAT": {
567
+ "f1": 0.9648745519713262,
568
+ "number": 694,
569
+ "precision": 0.9600570613409415,
570
+ "recall": 0.9697406340057637
571
+ },
572
+ "eval_TITRE": {
573
+ "f1": 0.0,
574
+ "number": 2,
575
+ "precision": 0.0,
576
+ "recall": 0.0
577
+ },
578
+ "eval_TITREH": {
579
+ "f1": 0.5,
580
+ "number": 33,
581
+ "precision": 0.4857142857142857,
582
+ "recall": 0.5151515151515151
583
+ },
584
+ "eval_TITREP": {
585
+ "f1": 0.3333333333333333,
586
+ "number": 6,
587
+ "precision": 0.3333333333333333,
588
+ "recall": 0.3333333333333333
589
+ },
590
+ "eval_accuracy": 0.9612756264236902,
591
+ "eval_accuracy-all": 0.9720323968615541,
592
+ "eval_accuracy-das": 0.9725385978233358,
593
+ "eval_accuracy-l1": 0.9681093394077449,
594
+ "eval_accuracy-l2": 0.9759554543153632,
595
+ "eval_f1": 0.9551374819102749,
596
+ "eval_f1-all": 0.951030551089022,
597
+ "eval_f1-das": 0.9584415584415584,
598
+ "eval_f1-l1": 0.9515372589890569,
599
+ "eval_f1-l2": 0.9503829503829505,
600
+ "eval_loss": 0.16416500508785248,
601
+ "eval_precision": 0.9510086455331412,
602
+ "eval_precision-all": 0.9470160116448326,
603
+ "eval_precision-das": 0.9548983364140481,
604
+ "eval_precision-l1": 0.9446456285566477,
605
+ "eval_precision-l2": 0.9500665778961385,
606
+ "eval_recall": 0.9593023255813954,
607
+ "eval_recall-all": 0.955079271873165,
608
+ "eval_recall-das": 0.9620111731843576,
609
+ "eval_recall-l1": 0.9585301837270341,
610
+ "eval_recall-l2": 0.9506995336442372,
611
+ "eval_runtime": 5.484,
612
+ "eval_samples_per_second": 123.267,
613
+ "eval_steps_per_second": 7.841,
614
+ "step": 600
615
+ },
616
+ {
617
+ "epoch": 1.84,
618
+ "eval_ACT": {
619
+ "f1": 0.9315589353612168,
620
+ "number": 519,
621
+ "precision": 0.9193245778611632,
622
+ "recall": 0.9441233140655106
623
+ },
624
+ "eval_ACT_L1": {
625
+ "f1": 0.9494163424124514,
626
+ "number": 503,
627
+ "precision": 0.9295238095238095,
628
+ "recall": 0.9701789264413518
629
+ },
630
+ "eval_ACT_L2": {
631
+ "f1": 0.16666666666666666,
632
+ "number": 16,
633
+ "precision": 0.25,
634
+ "recall": 0.125
635
+ },
636
+ "eval_CARDINAL": {
637
+ "f1": 0.9882352941176471,
638
+ "number": 678,
639
+ "precision": 0.9853372434017595,
640
+ "recall": 0.9911504424778761
641
+ },
642
+ "eval_DESC": {
643
+ "f1": 0.37142857142857144,
644
+ "number": 30,
645
+ "precision": 0.325,
646
+ "recall": 0.43333333333333335
647
+ },
648
+ "eval_FT": {
649
+ "f1": 0.22222222222222224,
650
+ "number": 7,
651
+ "precision": 0.5,
652
+ "recall": 0.14285714285714285
653
+ },
654
+ "eval_LOC": {
655
+ "f1": 0.9505851755526659,
656
+ "number": 761,
657
+ "precision": 0.9407979407979408,
658
+ "recall": 0.9605781865965834
659
+ },
660
+ "eval_PER": {
661
+ "f1": 0.9652623798965262,
662
+ "number": 676,
663
+ "precision": 0.9645494830132939,
664
+ "recall": 0.9659763313609467
665
+ },
666
+ "eval_SPAT": {
667
+ "f1": 0.9691756272401433,
668
+ "number": 694,
669
+ "precision": 0.9643366619115549,
670
+ "recall": 0.9740634005763689
671
+ },
672
+ "eval_TITRE": {
673
+ "f1": 0.0,
674
+ "number": 2,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_TITREH": {
679
+ "f1": 0.7536231884057971,
680
+ "number": 33,
681
+ "precision": 0.7222222222222222,
682
+ "recall": 0.7878787878787878
683
+ },
684
+ "eval_TITREP": {
685
+ "f1": 0.5454545454545454,
686
+ "number": 6,
687
+ "precision": 0.6,
688
+ "recall": 0.5
689
+ },
690
+ "eval_accuracy": 0.9586180713743356,
691
+ "eval_accuracy-all": 0.9714629207795494,
692
+ "eval_accuracy-das": 0.9693748418121995,
693
+ "eval_accuracy-l1": 0.9659579853201721,
694
+ "eval_accuracy-l2": 0.9769678562389269,
695
+ "eval_f1": 0.953810623556582,
696
+ "eval_f1-all": 0.95203382417262,
697
+ "eval_f1-das": 0.9564734210038897,
698
+ "eval_f1-l1": 0.9511434511434511,
699
+ "eval_f1-l2": 0.9531717037529059,
700
+ "eval_loss": 0.14926117658615112,
701
+ "eval_precision": 0.9472477064220184,
702
+ "eval_precision-all": 0.9455545902114104,
703
+ "eval_precision-das": 0.9513633014001474,
704
+ "eval_precision-l1": 0.9418425115800309,
705
+ "eval_precision-l2": 0.9503311258278145,
706
+ "eval_recall": 0.9604651162790697,
707
+ "eval_recall-all": 0.958602466236054,
708
+ "eval_recall-das": 0.9616387337057728,
709
+ "eval_recall-l1": 0.9606299212598425,
710
+ "eval_recall-l2": 0.9560293137908061,
711
+ "eval_runtime": 5.4819,
712
+ "eval_samples_per_second": 123.315,
713
+ "eval_steps_per_second": 7.844,
714
+ "step": 700
715
+ },
716
+ {
717
+ "epoch": 2.1,
718
+ "eval_ACT": {
719
+ "f1": 0.9513822688274547,
720
+ "number": 519,
721
+ "precision": 0.9415094339622642,
722
+ "recall": 0.9614643545279383
723
+ },
724
+ "eval_ACT_L1": {
725
+ "f1": 0.9753208292201382,
726
+ "number": 503,
727
+ "precision": 0.9686274509803922,
728
+ "recall": 0.9821073558648111
729
+ },
730
+ "eval_ACT_L2": {
731
+ "f1": 0.2777777777777778,
732
+ "number": 16,
733
+ "precision": 0.25,
734
+ "recall": 0.3125
735
+ },
736
+ "eval_CARDINAL": {
737
+ "f1": 0.9838235294117647,
738
+ "number": 678,
739
+ "precision": 0.9809384164222874,
740
+ "recall": 0.9867256637168141
741
+ },
742
+ "eval_DESC": {
743
+ "f1": 0.41666666666666663,
744
+ "number": 30,
745
+ "precision": 0.35714285714285715,
746
+ "recall": 0.5
747
+ },
748
+ "eval_FT": {
749
+ "f1": 0.2,
750
+ "number": 7,
751
+ "precision": 0.3333333333333333,
752
+ "recall": 0.14285714285714285
753
+ },
754
+ "eval_LOC": {
755
+ "f1": 0.9544270833333334,
756
+ "number": 761,
757
+ "precision": 0.9458064516129032,
758
+ "recall": 0.9632063074901446
759
+ },
760
+ "eval_PER": {
761
+ "f1": 0.9748892171344165,
762
+ "number": 676,
763
+ "precision": 0.9734513274336283,
764
+ "recall": 0.9763313609467456
765
+ },
766
+ "eval_SPAT": {
767
+ "f1": 0.9569583931133429,
768
+ "number": 694,
769
+ "precision": 0.9528571428571428,
770
+ "recall": 0.9610951008645533
771
+ },
772
+ "eval_TITRE": {
773
+ "f1": 0.0,
774
+ "number": 2,
775
+ "precision": 0.0,
776
+ "recall": 0.0
777
+ },
778
+ "eval_TITREH": {
779
+ "f1": 0.7761194029850745,
780
+ "number": 33,
781
+ "precision": 0.7647058823529411,
782
+ "recall": 0.7878787878787878
783
+ },
784
+ "eval_TITREP": {
785
+ "f1": 0.3636363636363636,
786
+ "number": 6,
787
+ "precision": 0.4,
788
+ "recall": 0.3333333333333333
789
+ },
790
+ "eval_accuracy": 0.9616552771450265,
791
+ "eval_accuracy-all": 0.9710832700582132,
792
+ "eval_accuracy-das": 0.9773475069602632,
793
+ "eval_accuracy-l1": 0.9678562389268539,
794
+ "eval_accuracy-l2": 0.9743103011895723,
795
+ "eval_f1": 0.9578886645514854,
796
+ "eval_f1-all": 0.9546316557257476,
797
+ "eval_f1-das": 0.96274328081557,
798
+ "eval_f1-l1": 0.9574967405475882,
799
+ "eval_f1-l2": 0.9509933774834437,
800
+ "eval_loss": 0.13481108844280243,
801
+ "eval_precision": 0.9504865483686319,
802
+ "eval_precision-all": 0.9486807770368223,
803
+ "eval_precision-das": 0.9583025830258303,
804
+ "eval_precision-l1": 0.9512953367875647,
805
+ "eval_precision-l2": 0.945358788676761,
806
+ "eval_recall": 0.9654069767441861,
807
+ "eval_recall-all": 0.9606576629477392,
808
+ "eval_recall-das": 0.9672253258845438,
809
+ "eval_recall-l1": 0.9637795275590552,
810
+ "eval_recall-l2": 0.9566955363091273,
811
+ "eval_runtime": 5.8282,
812
+ "eval_samples_per_second": 115.988,
813
+ "eval_steps_per_second": 7.378,
814
+ "step": 800
815
+ },
816
+ {
817
+ "epoch": 2.36,
818
+ "eval_ACT": {
819
+ "f1": 0.9456625357483317,
820
+ "number": 519,
821
+ "precision": 0.9358490566037736,
822
+ "recall": 0.9556840077071291
823
+ },
824
+ "eval_ACT_L1": {
825
+ "f1": 0.9627450980392156,
826
+ "number": 503,
827
+ "precision": 0.9497098646034816,
828
+ "recall": 0.9761431411530815
829
+ },
830
+ "eval_ACT_L2": {
831
+ "f1": 0.3448275862068966,
832
+ "number": 16,
833
+ "precision": 0.38461538461538464,
834
+ "recall": 0.3125
835
+ },
836
+ "eval_CARDINAL": {
837
+ "f1": 0.9882179675994109,
838
+ "number": 678,
839
+ "precision": 0.986764705882353,
840
+ "recall": 0.9896755162241888
841
+ },
842
+ "eval_DESC": {
843
+ "f1": 0.47761194029850745,
844
+ "number": 30,
845
+ "precision": 0.43243243243243246,
846
+ "recall": 0.5333333333333333
847
+ },
848
+ "eval_FT": {
849
+ "f1": 0.4444444444444445,
850
+ "number": 7,
851
+ "precision": 1.0,
852
+ "recall": 0.2857142857142857
853
+ },
854
+ "eval_LOC": {
855
+ "f1": 0.961311475409836,
856
+ "number": 761,
857
+ "precision": 0.9594240837696335,
858
+ "recall": 0.9632063074901446
859
+ },
860
+ "eval_PER": {
861
+ "f1": 0.9837758112094395,
862
+ "number": 676,
863
+ "precision": 0.9808823529411764,
864
+ "recall": 0.9866863905325444
865
+ },
866
+ "eval_SPAT": {
867
+ "f1": 0.9712230215827338,
868
+ "number": 694,
869
+ "precision": 0.9698275862068966,
870
+ "recall": 0.9726224783861671
871
+ },
872
+ "eval_TITRE": {
873
+ "f1": 0.0,
874
+ "number": 2,
875
+ "precision": 0.0,
876
+ "recall": 0.0
877
+ },
878
+ "eval_TITREH": {
879
+ "f1": 0.9117647058823529,
880
+ "number": 33,
881
+ "precision": 0.8857142857142857,
882
+ "recall": 0.9393939393939394
883
+ },
884
+ "eval_TITREP": {
885
+ "f1": 0.3333333333333333,
886
+ "number": 6,
887
+ "precision": 0.3333333333333333,
888
+ "recall": 0.3333333333333333
889
+ },
890
+ "eval_accuracy": 0.9681093394077449,
891
+ "eval_accuracy-all": 0.9769678562389269,
892
+ "eval_accuracy-das": 0.9791192103264996,
893
+ "eval_accuracy-l1": 0.9740572007086813,
894
+ "eval_accuracy-l2": 0.9798785117691724,
895
+ "eval_f1": 0.9645081848471678,
896
+ "eval_f1-all": 0.9634289057928613,
897
+ "eval_f1-das": 0.9686048671744381,
898
+ "eval_f1-l1": 0.9642764015645371,
899
+ "eval_f1-l2": 0.9623458847050984,
900
+ "eval_loss": 0.13176283240318298,
901
+ "eval_precision": 0.9613052266820675,
902
+ "eval_precision-all": 0.9600583090379009,
903
+ "eval_precision-das": 0.9662713120830244,
904
+ "eval_precision-l1": 0.9580310880829016,
905
+ "eval_precision-l2": 0.9626666666666667,
906
+ "eval_recall": 0.9677325581395348,
907
+ "eval_recall-all": 0.966823253082795,
908
+ "eval_recall-das": 0.9709497206703911,
909
+ "eval_recall-l1": 0.9706036745406824,
910
+ "eval_recall-l2": 0.9620253164556962,
911
+ "eval_runtime": 5.853,
912
+ "eval_samples_per_second": 115.497,
913
+ "eval_steps_per_second": 7.347,
914
+ "step": 900
915
+ },
916
+ {
917
+ "epoch": 2.62,
918
+ "learning_rate": 8e-05,
919
+ "loss": 0.1255,
920
+ "step": 1000
921
+ },
922
+ {
923
+ "epoch": 2.62,
924
+ "eval_ACT": {
925
+ "f1": 0.9449715370018975,
926
+ "number": 519,
927
+ "precision": 0.930841121495327,
928
+ "recall": 0.9595375722543352
929
+ },
930
+ "eval_ACT_L1": {
931
+ "f1": 0.9637610186092068,
932
+ "number": 503,
933
+ "precision": 0.9498069498069498,
934
+ "recall": 0.9781312127236581
935
+ },
936
+ "eval_ACT_L2": {
937
+ "f1": 0.3636363636363636,
938
+ "number": 16,
939
+ "precision": 0.35294117647058826,
940
+ "recall": 0.375
941
+ },
942
+ "eval_CARDINAL": {
943
+ "f1": 0.9896907216494845,
944
+ "number": 678,
945
+ "precision": 0.9882352941176471,
946
+ "recall": 0.9911504424778761
947
+ },
948
+ "eval_DESC": {
949
+ "f1": 0.5205479452054794,
950
+ "number": 30,
951
+ "precision": 0.4418604651162791,
952
+ "recall": 0.6333333333333333
953
+ },
954
+ "eval_FT": {
955
+ "f1": 0.4,
956
+ "number": 7,
957
+ "precision": 0.6666666666666666,
958
+ "recall": 0.2857142857142857
959
+ },
960
+ "eval_LOC": {
961
+ "f1": 0.9639344262295081,
962
+ "number": 761,
963
+ "precision": 0.9620418848167539,
964
+ "recall": 0.9658344283837057
965
+ },
966
+ "eval_PER": {
967
+ "f1": 0.9807692307692307,
968
+ "number": 676,
969
+ "precision": 0.9807692307692307,
970
+ "recall": 0.9807692307692307
971
+ },
972
+ "eval_SPAT": {
973
+ "f1": 0.9676956209619526,
974
+ "number": 694,
975
+ "precision": 0.9642346208869814,
976
+ "recall": 0.9711815561959655
977
+ },
978
+ "eval_TITRE": {
979
+ "f1": 0.0,
980
+ "number": 2,
981
+ "precision": 0.0,
982
+ "recall": 0.0
983
+ },
984
+ "eval_TITREH": {
985
+ "f1": 0.8615384615384615,
986
+ "number": 33,
987
+ "precision": 0.875,
988
+ "recall": 0.8484848484848485
989
+ },
990
+ "eval_TITREP": {
991
+ "f1": 0.3333333333333333,
992
+ "number": 6,
993
+ "precision": 0.3333333333333333,
994
+ "recall": 0.3333333333333333
995
+ },
996
+ "eval_accuracy": 0.9682358896481903,
997
+ "eval_accuracy-all": 0.9760187294355859,
998
+ "eval_accuracy-das": 0.9798785117691724,
999
+ "eval_accuracy-l1": 0.9729182485446722,
1000
+ "eval_accuracy-l2": 0.9791192103264996,
1001
+ "eval_f1": 0.9649173673528558,
1002
+ "eval_f1-all": 0.962302746931619,
1003
+ "eval_f1-das": 0.9680297397769516,
1004
+ "eval_f1-l1": 0.9622494142150483,
1005
+ "eval_f1-l2": 0.9623709623709623,
1006
+ "eval_loss": 0.1248239278793335,
1007
+ "eval_precision": 0.9624060150375939,
1008
+ "eval_precision-all": 0.9578243164630599,
1009
+ "eval_precision-das": 0.9662337662337662,
1010
+ "eval_precision-l1": 0.9545454545454546,
1011
+ "eval_precision-l2": 0.9620505992010653,
1012
+ "eval_recall": 0.9674418604651163,
1013
+ "eval_recall-all": 0.966823253082795,
1014
+ "eval_recall-das": 0.9698324022346368,
1015
+ "eval_recall-l1": 0.9700787401574803,
1016
+ "eval_recall-l2": 0.9626915389740173,
1017
+ "eval_runtime": 5.3948,
1018
+ "eval_samples_per_second": 125.307,
1019
+ "eval_steps_per_second": 7.971,
1020
+ "step": 1000
1021
+ }
1022
+ ],
1023
+ "max_steps": 5000,
1024
+ "num_train_epochs": 14,
1025
+ "total_flos": 408798986982336.0,
1026
+ "trial_name": null,
1027
+ "trial_params": null
1028
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f80e2880b6f530ce65e2922fc7676701918903c26c046655072ee6d45287ded
3
+ size 3503