nlpso commited on
Commit
5cf5142
1 Parent(s): 6a95073

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-PER+O",
17
+ "2": "I-PER+i_TITREH",
18
+ "3": "I-ACT+O",
19
+ "4": "I-DESC+O",
20
+ "5": "I-DESC+i_ACT",
21
+ "6": "I-DESC+i_TITREP",
22
+ "7": "I-SPAT+O",
23
+ "8": "I-SPAT+i_LOC",
24
+ "9": "I-SPAT+i_CARDINAL",
25
+ "10": "I-SPAT+i_FT",
26
+ "11": "I-TITRE+O"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "label2id": {
31
+ "I-ACT+O": 3,
32
+ "I-DESC+O": 4,
33
+ "I-DESC+i_ACT": 5,
34
+ "I-DESC+i_TITREP": 6,
35
+ "I-PER+O": 1,
36
+ "I-PER+i_TITREH": 2,
37
+ "I-SPAT+O": 7,
38
+ "I-SPAT+i_CARDINAL": 9,
39
+ "I-SPAT+i_FT": 10,
40
+ "I-SPAT+i_LOC": 8,
41
+ "I-TITRE+O": 11,
42
+ "O+O": 0
43
+ },
44
+ "layer_norm_eps": 1e-05,
45
+ "max_position_embeddings": 514,
46
+ "model_type": "camembert",
47
+ "num_attention_heads": 12,
48
+ "num_hidden_layers": 12,
49
+ "output_past": true,
50
+ "pad_token_id": 1,
51
+ "position_embedding_type": "absolute",
52
+ "torch_dtype": "float32",
53
+ "transformers_version": "4.25.1",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 32005
57
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4cba482b27702001a3b86475d3b9b72f761286124ff6ce5c1f0c44f8ca7572c
3
+ size 880440037
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b75eed96c8dcc0bb0c63fa76c8f6db31beab651158b4370fc6bcd3029d8600
3
+ size 440233393
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10e0deb8984910703030ca3f179066fb3f496f3fa4c860d5804407f8c72066f2
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48f2a75f3ed3f16767915866d392dbc6d954dd1374475cfd20580f7c483a9e55
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,1228 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9684392563769997,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/311-camembert-ner-hierarchical-loss-io/checkpoint-1200",
4
+ "epoch": 3.1496062992125986,
5
+ "global_step": 1200,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.9010175763182239,
14
+ "number": 519,
15
+ "precision": 0.8665480427046264,
16
+ "recall": 0.9383429672447013
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.9145539906103287,
20
+ "number": 503,
21
+ "precision": 0.8665480427046264,
22
+ "recall": 0.9681908548707754
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9911894273127753,
32
+ "number": 678,
33
+ "precision": 0.9868421052631579,
34
+ "recall": 0.995575221238938
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9495472186287194,
50
+ "number": 761,
51
+ "precision": 0.935031847133758,
52
+ "recall": 0.9645203679369251
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9402214022140221,
56
+ "number": 676,
57
+ "precision": 0.9381443298969072,
58
+ "recall": 0.9423076923076923
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.9390934844192635,
62
+ "number": 694,
63
+ "precision": 0.9233983286908078,
64
+ "recall": 0.9553314121037464
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 5,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.9394240317775571,
85
+ "eval_accuracy-all": 0.956616186693148,
86
+ "eval_accuracy-das": 0.9525819265143992,
87
+ "eval_accuracy-l1": 0.9433962264150944,
88
+ "eval_accuracy-l2": 0.9698361469712016,
89
+ "eval_f1": 0.9469872537659327,
90
+ "eval_f1-all": 0.9354602663544563,
91
+ "eval_f1-das": 0.9454949944382648,
92
+ "eval_f1-l1": 0.9249482401656315,
93
+ "eval_f1-l2": 0.9491411249578983,
94
+ "eval_loss": 0.33225661516189575,
95
+ "eval_precision": 0.947261663286004,
96
+ "eval_precision-all": 0.9323220536756126,
97
+ "eval_precision-das": 0.940959409594096,
98
+ "eval_precision-l1": 0.9122001020929046,
99
+ "eval_precision-l2": 0.9591558883594282,
100
+ "eval_recall": 0.9467130031856357,
101
+ "eval_recall-all": 0.9386196769456682,
102
+ "eval_recall-das": 0.9500745156482862,
103
+ "eval_recall-l1": 0.9380577427821523,
104
+ "eval_recall-l2": 0.9393333333333334,
105
+ "eval_runtime": 20.7794,
106
+ "eval_samples_per_second": 32.532,
107
+ "eval_steps_per_second": 2.069,
108
+ "step": 100
109
+ },
110
+ {
111
+ "epoch": 0.52,
112
+ "eval_ACT": {
113
+ "f1": 0.9138576779026217,
114
+ "number": 519,
115
+ "precision": 0.8888888888888888,
116
+ "recall": 0.9402697495183044
117
+ },
118
+ "eval_ACT_L1": {
119
+ "f1": 0.9277566539923954,
120
+ "number": 503,
121
+ "precision": 0.8888888888888888,
122
+ "recall": 0.9701789264413518
123
+ },
124
+ "eval_ACT_L2": {
125
+ "f1": 0.0,
126
+ "number": 16,
127
+ "precision": 0.0,
128
+ "recall": 0.0
129
+ },
130
+ "eval_CARDINAL": {
131
+ "f1": 0.9874723655121592,
132
+ "number": 678,
133
+ "precision": 0.9867452135493373,
134
+ "recall": 0.9882005899705014
135
+ },
136
+ "eval_DESC": {
137
+ "f1": 0.2758620689655172,
138
+ "number": 30,
139
+ "precision": 0.2857142857142857,
140
+ "recall": 0.26666666666666666
141
+ },
142
+ "eval_FT": {
143
+ "f1": 0.0,
144
+ "number": 7,
145
+ "precision": 0.0,
146
+ "recall": 0.0
147
+ },
148
+ "eval_LOC": {
149
+ "f1": 0.9415542710340399,
150
+ "number": 761,
151
+ "precision": 0.9208542713567839,
152
+ "recall": 0.9632063074901446
153
+ },
154
+ "eval_PER": {
155
+ "f1": 0.9559471365638766,
156
+ "number": 676,
157
+ "precision": 0.9489795918367347,
158
+ "recall": 0.9630177514792899
159
+ },
160
+ "eval_SPAT": {
161
+ "f1": 0.9455830388692581,
162
+ "number": 694,
163
+ "precision": 0.9278779472954231,
164
+ "recall": 0.9639769452449568
165
+ },
166
+ "eval_TITRE": {
167
+ "f1": 0.0,
168
+ "number": 2,
169
+ "precision": 0.0,
170
+ "recall": 0.0
171
+ },
172
+ "eval_TITREH": {
173
+ "f1": 0.5666666666666667,
174
+ "number": 33,
175
+ "precision": 0.6296296296296297,
176
+ "recall": 0.5151515151515151
177
+ },
178
+ "eval_TITREP": {
179
+ "f1": 0.0,
180
+ "number": 5,
181
+ "precision": 0.0,
182
+ "recall": 0.0
183
+ },
184
+ "eval_accuracy": 0.9484856007944389,
185
+ "eval_accuracy-all": 0.9626986097318768,
186
+ "eval_accuracy-das": 0.9611469712015889,
187
+ "eval_accuracy-l1": 0.9540714995034757,
188
+ "eval_accuracy-l2": 0.9713257199602781,
189
+ "eval_f1": 0.9447711949505092,
190
+ "eval_f1-all": 0.9391960528225222,
191
+ "eval_f1-das": 0.944280442804428,
192
+ "eval_f1-l1": 0.9339161738236049,
193
+ "eval_f1-l2": 0.9460359760159894,
194
+ "eval_loss": 0.24740029871463776,
195
+ "eval_precision": 0.9360432063672541,
196
+ "eval_precision-all": 0.9282845668387837,
197
+ "eval_precision-das": 0.9353070175438597,
198
+ "eval_precision-l1": 0.9153225806451613,
199
+ "eval_precision-l2": 0.9454061251664447,
200
+ "eval_recall": 0.9536634810309875,
201
+ "eval_recall-all": 0.950367107195301,
202
+ "eval_recall-das": 0.9534277198211625,
203
+ "eval_recall-l1": 0.9532808398950131,
204
+ "eval_recall-l2": 0.9466666666666667,
205
+ "eval_runtime": 8.6217,
206
+ "eval_samples_per_second": 78.406,
207
+ "eval_steps_per_second": 4.987,
208
+ "step": 200
209
+ },
210
+ {
211
+ "epoch": 0.79,
212
+ "eval_ACT": {
213
+ "f1": 0.9371428571428572,
214
+ "number": 519,
215
+ "precision": 0.9265536723163842,
216
+ "recall": 0.9479768786127167
217
+ },
218
+ "eval_ACT_L1": {
219
+ "f1": 0.9516441005802708,
220
+ "number": 503,
221
+ "precision": 0.9265536723163842,
222
+ "recall": 0.9781312127236581
223
+ },
224
+ "eval_ACT_L2": {
225
+ "f1": 0.0,
226
+ "number": 16,
227
+ "precision": 0.0,
228
+ "recall": 0.0
229
+ },
230
+ "eval_CARDINAL": {
231
+ "f1": 0.9904481998530492,
232
+ "number": 678,
233
+ "precision": 0.986822840409956,
234
+ "recall": 0.9941002949852508
235
+ },
236
+ "eval_DESC": {
237
+ "f1": 0.2962962962962963,
238
+ "number": 30,
239
+ "precision": 0.3333333333333333,
240
+ "recall": 0.26666666666666666
241
+ },
242
+ "eval_FT": {
243
+ "f1": 0.0,
244
+ "number": 7,
245
+ "precision": 0.0,
246
+ "recall": 0.0
247
+ },
248
+ "eval_LOC": {
249
+ "f1": 0.9492187500000001,
250
+ "number": 761,
251
+ "precision": 0.9406451612903226,
252
+ "recall": 0.9579500657030223
253
+ },
254
+ "eval_PER": {
255
+ "f1": 0.9800443458980044,
256
+ "number": 676,
257
+ "precision": 0.9793205317577548,
258
+ "recall": 0.9807692307692307
259
+ },
260
+ "eval_SPAT": {
261
+ "f1": 0.9494661921708185,
262
+ "number": 694,
263
+ "precision": 0.9381153305203939,
264
+ "recall": 0.9610951008645533
265
+ },
266
+ "eval_TITRE": {
267
+ "f1": 0.0,
268
+ "number": 2,
269
+ "precision": 0.0,
270
+ "recall": 0.0
271
+ },
272
+ "eval_TITREH": {
273
+ "f1": 0.8615384615384615,
274
+ "number": 33,
275
+ "precision": 0.875,
276
+ "recall": 0.8484848484848485
277
+ },
278
+ "eval_TITREP": {
279
+ "f1": 0.0,
280
+ "number": 5,
281
+ "precision": 0.0,
282
+ "recall": 0.0
283
+ },
284
+ "eval_accuracy": 0.9577954319761668,
285
+ "eval_accuracy-all": 0.9672293942403177,
286
+ "eval_accuracy-das": 0.9703326713008937,
287
+ "eval_accuracy-l1": 0.961643495531281,
288
+ "eval_accuracy-l2": 0.9728152929493545,
289
+ "eval_f1": 0.9603587962962964,
290
+ "eval_f1-all": 0.9537876572097104,
291
+ "eval_f1-das": 0.9622886866059818,
292
+ "eval_f1-l1": 0.9511434511434511,
293
+ "eval_f1-l2": 0.957190635451505,
294
+ "eval_loss": 0.20228183269500732,
295
+ "eval_precision": 0.9595258745302111,
296
+ "eval_precision-all": 0.9498980483542091,
297
+ "eval_precision-das": 0.9596146721007781,
298
+ "eval_precision-l1": 0.9418425115800309,
299
+ "eval_precision-l2": 0.9604026845637584,
300
+ "eval_recall": 0.9611931653634521,
301
+ "eval_recall-all": 0.9577092511013215,
302
+ "eval_recall-das": 0.9649776453055141,
303
+ "eval_recall-l1": 0.9606299212598425,
304
+ "eval_recall-l2": 0.954,
305
+ "eval_runtime": 13.7481,
306
+ "eval_samples_per_second": 49.17,
307
+ "eval_steps_per_second": 3.128,
308
+ "step": 300
309
+ },
310
+ {
311
+ "epoch": 1.05,
312
+ "eval_ACT": {
313
+ "f1": 0.9320574162679425,
314
+ "number": 519,
315
+ "precision": 0.9258555133079848,
316
+ "recall": 0.9383429672447013
317
+ },
318
+ "eval_ACT_L1": {
319
+ "f1": 0.9530332681017614,
320
+ "number": 503,
321
+ "precision": 0.9383429672447013,
322
+ "recall": 0.9681908548707754
323
+ },
324
+ "eval_ACT_L2": {
325
+ "f1": 0.0,
326
+ "number": 16,
327
+ "precision": 0.0,
328
+ "recall": 0.0
329
+ },
330
+ "eval_CARDINAL": {
331
+ "f1": 0.9926470588235294,
332
+ "number": 678,
333
+ "precision": 0.9897360703812317,
334
+ "recall": 0.995575221238938
335
+ },
336
+ "eval_DESC": {
337
+ "f1": 0.18750000000000003,
338
+ "number": 30,
339
+ "precision": 0.17647058823529413,
340
+ "recall": 0.2
341
+ },
342
+ "eval_FT": {
343
+ "f1": 0.0,
344
+ "number": 7,
345
+ "precision": 0.0,
346
+ "recall": 0.0
347
+ },
348
+ "eval_LOC": {
349
+ "f1": 0.9535036018336608,
350
+ "number": 761,
351
+ "precision": 0.9503916449086162,
352
+ "recall": 0.9566360052562418
353
+ },
354
+ "eval_PER": {
355
+ "f1": 0.967032967032967,
356
+ "number": 676,
357
+ "precision": 0.9579100145137881,
358
+ "recall": 0.9763313609467456
359
+ },
360
+ "eval_SPAT": {
361
+ "f1": 0.9663564781675018,
362
+ "number": 694,
363
+ "precision": 0.9601706970128022,
364
+ "recall": 0.9726224783861671
365
+ },
366
+ "eval_TITRE": {
367
+ "f1": 0.0,
368
+ "number": 2,
369
+ "precision": 0.0,
370
+ "recall": 0.0
371
+ },
372
+ "eval_TITREH": {
373
+ "f1": 0.927536231884058,
374
+ "number": 33,
375
+ "precision": 0.8888888888888888,
376
+ "recall": 0.9696969696969697
377
+ },
378
+ "eval_TITREP": {
379
+ "f1": 0.0,
380
+ "number": 5,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_accuracy": 0.9505958291956306,
385
+ "eval_accuracy-all": 0.9659260178748759,
386
+ "eval_accuracy-das": 0.9659880834160874,
387
+ "eval_accuracy-l1": 0.9558093346573983,
388
+ "eval_accuracy-l2": 0.9760427010923535,
389
+ "eval_f1": 0.955606803113289,
390
+ "eval_f1-all": 0.9539541002777371,
391
+ "eval_f1-das": 0.9637613826426314,
392
+ "eval_f1-l1": 0.9496103896103896,
393
+ "eval_f1-l2": 0.9595453025743899,
394
+ "eval_loss": 0.16856572031974792,
395
+ "eval_precision": 0.9512195121951219,
396
+ "eval_precision-all": 0.94965075669383,
397
+ "eval_precision-das": 0.9614386355209492,
398
+ "eval_precision-l1": 0.9398457583547558,
399
+ "eval_precision-l2": 0.9624413145539906,
400
+ "eval_recall": 0.9600347523892268,
401
+ "eval_recall-all": 0.9582966226138032,
402
+ "eval_recall-das": 0.9660953800298062,
403
+ "eval_recall-l1": 0.9595800524934384,
404
+ "eval_recall-l2": 0.9566666666666667,
405
+ "eval_runtime": 11.6651,
406
+ "eval_samples_per_second": 57.951,
407
+ "eval_steps_per_second": 3.686,
408
+ "step": 400
409
+ },
410
+ {
411
+ "epoch": 1.31,
412
+ "learning_rate": 9e-05,
413
+ "loss": 0.3379,
414
+ "step": 500
415
+ },
416
+ {
417
+ "epoch": 1.31,
418
+ "eval_ACT": {
419
+ "f1": 0.9362511893434823,
420
+ "number": 519,
421
+ "precision": 0.924812030075188,
422
+ "recall": 0.9479768786127167
423
+ },
424
+ "eval_ACT_L1": {
425
+ "f1": 0.9616519174041297,
426
+ "number": 503,
427
+ "precision": 0.9513618677042801,
428
+ "recall": 0.9721669980119284
429
+ },
430
+ "eval_ACT_L2": {
431
+ "f1": 0.17647058823529413,
432
+ "number": 16,
433
+ "precision": 0.16666666666666666,
434
+ "recall": 0.1875
435
+ },
436
+ "eval_CARDINAL": {
437
+ "f1": 0.9933774834437086,
438
+ "number": 678,
439
+ "precision": 0.9911894273127754,
440
+ "recall": 0.995575221238938
441
+ },
442
+ "eval_DESC": {
443
+ "f1": 0.3823529411764707,
444
+ "number": 30,
445
+ "precision": 0.34210526315789475,
446
+ "recall": 0.43333333333333335
447
+ },
448
+ "eval_FT": {
449
+ "f1": 0.0,
450
+ "number": 7,
451
+ "precision": 0.0,
452
+ "recall": 0.0
453
+ },
454
+ "eval_LOC": {
455
+ "f1": 0.9488010369410239,
456
+ "number": 761,
457
+ "precision": 0.9360613810741688,
458
+ "recall": 0.961892247043364
459
+ },
460
+ "eval_PER": {
461
+ "f1": 0.9764705882352941,
462
+ "number": 676,
463
+ "precision": 0.9707602339181286,
464
+ "recall": 0.9822485207100592
465
+ },
466
+ "eval_SPAT": {
467
+ "f1": 0.9529914529914529,
468
+ "number": 694,
469
+ "precision": 0.9422535211267605,
470
+ "recall": 0.9639769452449568
471
+ },
472
+ "eval_TITRE": {
473
+ "f1": 0.0,
474
+ "number": 2,
475
+ "precision": 0.0,
476
+ "recall": 0.0
477
+ },
478
+ "eval_TITREH": {
479
+ "f1": 0.7878787878787878,
480
+ "number": 33,
481
+ "precision": 0.7878787878787878,
482
+ "recall": 0.7878787878787878
483
+ },
484
+ "eval_TITREP": {
485
+ "f1": 0.0,
486
+ "number": 5,
487
+ "precision": 0.0,
488
+ "recall": 0.0
489
+ },
490
+ "eval_accuracy": 0.952085402184707,
491
+ "eval_accuracy-all": 0.9604642502482622,
492
+ "eval_accuracy-das": 0.9714498510427011,
493
+ "eval_accuracy-l1": 0.9569265143992055,
494
+ "eval_accuracy-l2": 0.9640019860973188,
495
+ "eval_f1": 0.9596425482848083,
496
+ "eval_f1-all": 0.9529497450837582,
497
+ "eval_f1-das": 0.9628528974739969,
498
+ "eval_f1-l1": 0.9529992209815632,
499
+ "eval_f1-l2": 0.9528865295288654,
500
+ "eval_loss": 0.1725856363773346,
501
+ "eval_precision": 0.9552367288378766,
502
+ "eval_precision-all": 0.9453757225433526,
503
+ "eval_precision-das": 0.96,
504
+ "eval_precision-l1": 0.9429599177800617,
505
+ "eval_precision-l2": 0.9484808454425363,
506
+ "eval_recall": 0.9640891977990154,
507
+ "eval_recall-all": 0.9606461086637298,
508
+ "eval_recall-das": 0.9657228017883756,
509
+ "eval_recall-l1": 0.963254593175853,
510
+ "eval_recall-l2": 0.9573333333333334,
511
+ "eval_runtime": 16.0693,
512
+ "eval_samples_per_second": 42.068,
513
+ "eval_steps_per_second": 2.676,
514
+ "step": 500
515
+ },
516
+ {
517
+ "epoch": 1.57,
518
+ "eval_ACT": {
519
+ "f1": 0.9299242424242424,
520
+ "number": 519,
521
+ "precision": 0.9143389199255121,
522
+ "recall": 0.9460500963391136
523
+ },
524
+ "eval_ACT_L1": {
525
+ "f1": 0.949514563106796,
526
+ "number": 503,
527
+ "precision": 0.9278937381404174,
528
+ "recall": 0.9721669980119284
529
+ },
530
+ "eval_ACT_L2": {
531
+ "f1": 0.15384615384615385,
532
+ "number": 16,
533
+ "precision": 0.2,
534
+ "recall": 0.125
535
+ },
536
+ "eval_CARDINAL": {
537
+ "f1": 0.9933774834437086,
538
+ "number": 678,
539
+ "precision": 0.9911894273127754,
540
+ "recall": 0.995575221238938
541
+ },
542
+ "eval_DESC": {
543
+ "f1": 0.3333333333333333,
544
+ "number": 30,
545
+ "precision": 0.3055555555555556,
546
+ "recall": 0.36666666666666664
547
+ },
548
+ "eval_FT": {
549
+ "f1": 0.0,
550
+ "number": 7,
551
+ "precision": 0.0,
552
+ "recall": 0.0
553
+ },
554
+ "eval_LOC": {
555
+ "f1": 0.9640757674722404,
556
+ "number": 761,
557
+ "precision": 0.9584415584415584,
558
+ "recall": 0.9697766097240473
559
+ },
560
+ "eval_PER": {
561
+ "f1": 0.978629329403095,
562
+ "number": 676,
563
+ "precision": 0.9750367107195301,
564
+ "recall": 0.9822485207100592
565
+ },
566
+ "eval_SPAT": {
567
+ "f1": 0.9642346208869814,
568
+ "number": 694,
569
+ "precision": 0.9573863636363636,
570
+ "recall": 0.9711815561959655
571
+ },
572
+ "eval_TITRE": {
573
+ "f1": 0.0,
574
+ "number": 2,
575
+ "precision": 0.0,
576
+ "recall": 0.0
577
+ },
578
+ "eval_TITREH": {
579
+ "f1": 0.8857142857142858,
580
+ "number": 33,
581
+ "precision": 0.8378378378378378,
582
+ "recall": 0.9393939393939394
583
+ },
584
+ "eval_TITREP": {
585
+ "f1": 0.0,
586
+ "number": 5,
587
+ "precision": 0.0,
588
+ "recall": 0.0
589
+ },
590
+ "eval_accuracy": 0.951837140019861,
591
+ "eval_accuracy-all": 0.9630089374379345,
592
+ "eval_accuracy-das": 0.9715739821251241,
593
+ "eval_accuracy-l1": 0.9551886792452831,
594
+ "eval_accuracy-l2": 0.9708291956305859,
595
+ "eval_f1": 0.9633583381419504,
596
+ "eval_f1-all": 0.958692161728215,
597
+ "eval_f1-das": 0.9671431223315389,
598
+ "eval_f1-l1": 0.9540617700493121,
599
+ "eval_f1-l2": 0.9646430953969313,
600
+ "eval_loss": 0.1551111489534378,
601
+ "eval_precision": 0.959758551307847,
602
+ "eval_precision-all": 0.9529889727219966,
603
+ "eval_precision-das": 0.9637439881613022,
604
+ "eval_precision-l1": 0.9435318275154004,
605
+ "eval_precision-l2": 0.965287049399199,
606
+ "eval_recall": 0.9669852302345786,
607
+ "eval_recall-all": 0.9644640234948605,
608
+ "eval_recall-das": 0.9705663189269746,
609
+ "eval_recall-l1": 0.9648293963254593,
610
+ "eval_recall-l2": 0.964,
611
+ "eval_runtime": 7.6982,
612
+ "eval_samples_per_second": 87.813,
613
+ "eval_steps_per_second": 5.586,
614
+ "step": 600
615
+ },
616
+ {
617
+ "epoch": 1.84,
618
+ "eval_ACT": {
619
+ "f1": 0.9238005644402634,
620
+ "number": 519,
621
+ "precision": 0.9025735294117647,
622
+ "recall": 0.9460500963391136
623
+ },
624
+ "eval_ACT_L1": {
625
+ "f1": 0.9530332681017614,
626
+ "number": 503,
627
+ "precision": 0.9383429672447013,
628
+ "recall": 0.9681908548707754
629
+ },
630
+ "eval_ACT_L2": {
631
+ "f1": 0.19512195121951217,
632
+ "number": 16,
633
+ "precision": 0.16,
634
+ "recall": 0.25
635
+ },
636
+ "eval_CARDINAL": {
637
+ "f1": 0.9941089837997055,
638
+ "number": 678,
639
+ "precision": 0.9926470588235294,
640
+ "recall": 0.995575221238938
641
+ },
642
+ "eval_DESC": {
643
+ "f1": 0.33707865168539325,
644
+ "number": 30,
645
+ "precision": 0.2542372881355932,
646
+ "recall": 0.5
647
+ },
648
+ "eval_FT": {
649
+ "f1": 0.0,
650
+ "number": 7,
651
+ "precision": 0.0,
652
+ "recall": 0.0
653
+ },
654
+ "eval_LOC": {
655
+ "f1": 0.954308093994778,
656
+ "number": 761,
657
+ "precision": 0.9481193255512321,
658
+ "recall": 0.9605781865965834
659
+ },
660
+ "eval_PER": {
661
+ "f1": 0.9807976366322009,
662
+ "number": 676,
663
+ "precision": 0.9793510324483776,
664
+ "recall": 0.9822485207100592
665
+ },
666
+ "eval_SPAT": {
667
+ "f1": 0.9555236728837877,
668
+ "number": 694,
669
+ "precision": 0.9514285714285714,
670
+ "recall": 0.9596541786743515
671
+ },
672
+ "eval_TITRE": {
673
+ "f1": 0.0,
674
+ "number": 2,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_TITREH": {
679
+ "f1": 0.9411764705882354,
680
+ "number": 33,
681
+ "precision": 0.9142857142857143,
682
+ "recall": 0.9696969696969697
683
+ },
684
+ "eval_TITREP": {
685
+ "f1": 0.0,
686
+ "number": 5,
687
+ "precision": 0.0,
688
+ "recall": 0.0
689
+ },
690
+ "eval_accuracy": 0.9544438927507448,
691
+ "eval_accuracy-all": 0.9669190665342602,
692
+ "eval_accuracy-das": 0.9714498510427011,
693
+ "eval_accuracy-l1": 0.9606504468718967,
694
+ "eval_accuracy-l2": 0.9731876861966237,
695
+ "eval_f1": 0.9572330654420207,
696
+ "eval_f1-all": 0.9528521536670547,
697
+ "eval_f1-das": 0.9665551839464882,
698
+ "eval_f1-l1": 0.948976948976949,
699
+ "eval_f1-l2": 0.9578213218199934,
700
+ "eval_loss": 0.14552079141139984,
701
+ "eval_precision": 0.9487908961593172,
702
+ "eval_precision-all": 0.944332275742717,
703
+ "eval_precision-das": 0.964047442550037,
704
+ "eval_precision-l1": 0.9366053169734151,
705
+ "eval_precision-l2": 0.9543348775645268,
706
+ "eval_recall": 0.9658268172603534,
707
+ "eval_recall-all": 0.9615271659324522,
708
+ "eval_recall-das": 0.9690760059612519,
709
+ "eval_recall-l1": 0.9616797900262467,
710
+ "eval_recall-l2": 0.9613333333333334,
711
+ "eval_runtime": 13.1454,
712
+ "eval_samples_per_second": 51.425,
713
+ "eval_steps_per_second": 3.271,
714
+ "step": 700
715
+ },
716
+ {
717
+ "epoch": 2.1,
718
+ "eval_ACT": {
719
+ "f1": 0.9493791786055396,
720
+ "number": 519,
721
+ "precision": 0.9412878787878788,
722
+ "recall": 0.9576107899807321
723
+ },
724
+ "eval_ACT_L1": {
725
+ "f1": 0.9760956175298805,
726
+ "number": 503,
727
+ "precision": 0.9780439121756487,
728
+ "recall": 0.974155069582505
729
+ },
730
+ "eval_ACT_L2": {
731
+ "f1": 0.3255813953488372,
732
+ "number": 16,
733
+ "precision": 0.25925925925925924,
734
+ "recall": 0.4375
735
+ },
736
+ "eval_CARDINAL": {
737
+ "f1": 0.9933677229182019,
738
+ "number": 678,
739
+ "precision": 0.9926362297496318,
740
+ "recall": 0.9941002949852508
741
+ },
742
+ "eval_DESC": {
743
+ "f1": 0.45569620253164556,
744
+ "number": 30,
745
+ "precision": 0.3673469387755102,
746
+ "recall": 0.6
747
+ },
748
+ "eval_FT": {
749
+ "f1": 0.0,
750
+ "number": 7,
751
+ "precision": 0.0,
752
+ "recall": 0.0
753
+ },
754
+ "eval_LOC": {
755
+ "f1": 0.9652002626395274,
756
+ "number": 761,
757
+ "precision": 0.9645669291338582,
758
+ "recall": 0.9658344283837057
759
+ },
760
+ "eval_PER": {
761
+ "f1": 0.9830258302583026,
762
+ "number": 676,
763
+ "precision": 0.9808541973490427,
764
+ "recall": 0.985207100591716
765
+ },
766
+ "eval_SPAT": {
767
+ "f1": 0.9676956209619526,
768
+ "number": 694,
769
+ "precision": 0.9642346208869814,
770
+ "recall": 0.9711815561959655
771
+ },
772
+ "eval_TITRE": {
773
+ "f1": 0.0,
774
+ "number": 2,
775
+ "precision": 0.0,
776
+ "recall": 0.0
777
+ },
778
+ "eval_TITREH": {
779
+ "f1": 0.8985507246376813,
780
+ "number": 33,
781
+ "precision": 0.8611111111111112,
782
+ "recall": 0.9393939393939394
783
+ },
784
+ "eval_TITREP": {
785
+ "f1": 0.3636363636363636,
786
+ "number": 5,
787
+ "precision": 0.3333333333333333,
788
+ "recall": 0.4
789
+ },
790
+ "eval_accuracy": 0.9563058589870904,
791
+ "eval_accuracy-all": 0.9666708043694141,
792
+ "eval_accuracy-das": 0.9784011916583912,
793
+ "eval_accuracy-l1": 0.9617676266137041,
794
+ "eval_accuracy-l2": 0.9715739821251241,
795
+ "eval_f1": 0.965945165945166,
796
+ "eval_f1-all": 0.9636124506795265,
797
+ "eval_f1-das": 0.9720878302940081,
798
+ "eval_f1-l1": 0.9642577615444821,
799
+ "eval_f1-l2": 0.9627906976744186,
800
+ "eval_loss": 0.14274396002292633,
801
+ "eval_precision": 0.9626114466494105,
802
+ "eval_precision-all": 0.9589877835951134,
803
+ "eval_precision-das": 0.971003717472119,
804
+ "eval_precision-l1": 0.9585062240663901,
805
+ "eval_precision-l2": 0.9596026490066225,
806
+ "eval_recall": 0.9693020561830292,
807
+ "eval_recall-all": 0.9682819383259912,
808
+ "eval_recall-das": 0.9731743666169895,
809
+ "eval_recall-l1": 0.9700787401574803,
810
+ "eval_recall-l2": 0.966,
811
+ "eval_runtime": 32.3788,
812
+ "eval_samples_per_second": 20.878,
813
+ "eval_steps_per_second": 1.328,
814
+ "step": 800
815
+ },
816
+ {
817
+ "epoch": 2.36,
818
+ "eval_ACT": {
819
+ "f1": 0.9467680608365019,
820
+ "number": 519,
821
+ "precision": 0.9343339587242027,
822
+ "recall": 0.9595375722543352
823
+ },
824
+ "eval_ACT_L1": {
825
+ "f1": 0.9693372898120672,
826
+ "number": 503,
827
+ "precision": 0.9645669291338582,
828
+ "recall": 0.974155069582505
829
+ },
830
+ "eval_ACT_L2": {
831
+ "f1": 0.39024390243902435,
832
+ "number": 16,
833
+ "precision": 0.32,
834
+ "recall": 0.5
835
+ },
836
+ "eval_CARDINAL": {
837
+ "f1": 0.9933774834437086,
838
+ "number": 678,
839
+ "precision": 0.9911894273127754,
840
+ "recall": 0.995575221238938
841
+ },
842
+ "eval_DESC": {
843
+ "f1": 0.5333333333333333,
844
+ "number": 30,
845
+ "precision": 0.4444444444444444,
846
+ "recall": 0.6666666666666666
847
+ },
848
+ "eval_FT": {
849
+ "f1": 0.0,
850
+ "number": 7,
851
+ "precision": 0.0,
852
+ "recall": 0.0
853
+ },
854
+ "eval_LOC": {
855
+ "f1": 0.953063885267275,
856
+ "number": 761,
857
+ "precision": 0.9456662354463131,
858
+ "recall": 0.9605781865965834
859
+ },
860
+ "eval_PER": {
861
+ "f1": 0.9918699186991871,
862
+ "number": 676,
863
+ "precision": 0.9911373707533235,
864
+ "recall": 0.992603550295858
865
+ },
866
+ "eval_SPAT": {
867
+ "f1": 0.9627507163323783,
868
+ "number": 694,
869
+ "precision": 0.9572649572649573,
870
+ "recall": 0.968299711815562
871
+ },
872
+ "eval_TITRE": {
873
+ "f1": 0.0,
874
+ "number": 2,
875
+ "precision": 0.0,
876
+ "recall": 0.0
877
+ },
878
+ "eval_TITREH": {
879
+ "f1": 0.9411764705882354,
880
+ "number": 33,
881
+ "precision": 0.9142857142857143,
882
+ "recall": 0.9696969696969697
883
+ },
884
+ "eval_TITREP": {
885
+ "f1": 0.26666666666666666,
886
+ "number": 5,
887
+ "precision": 0.2,
888
+ "recall": 0.4
889
+ },
890
+ "eval_accuracy": 0.958291956305859,
891
+ "eval_accuracy-all": 0.9676017874875869,
892
+ "eval_accuracy-das": 0.9782770605759682,
893
+ "eval_accuracy-l1": 0.9653674280039722,
894
+ "eval_accuracy-l2": 0.9698361469712016,
895
+ "eval_f1": 0.9656065620952655,
896
+ "eval_f1-all": 0.9622504008162076,
897
+ "eval_f1-das": 0.9712377064390424,
898
+ "eval_f1-l1": 0.9658587438102684,
899
+ "eval_f1-l2": 0.9576719576719577,
900
+ "eval_loss": 0.13768324255943298,
901
+ "eval_precision": 0.9596681922196796,
902
+ "eval_precision-all": 0.9551504629629629,
903
+ "eval_precision-das": 0.9674676524953789,
904
+ "eval_precision-l1": 0.9591097308488613,
905
+ "eval_precision-l2": 0.9501312335958005,
906
+ "eval_recall": 0.9716188821314798,
907
+ "eval_recall-all": 0.9694566813509545,
908
+ "eval_recall-das": 0.9750372578241431,
909
+ "eval_recall-l1": 0.9727034120734908,
910
+ "eval_recall-l2": 0.9653333333333334,
911
+ "eval_runtime": 14.3312,
912
+ "eval_samples_per_second": 47.17,
913
+ "eval_steps_per_second": 3.0,
914
+ "step": 900
915
+ },
916
+ {
917
+ "epoch": 2.62,
918
+ "learning_rate": 8e-05,
919
+ "loss": 0.1289,
920
+ "step": 1000
921
+ },
922
+ {
923
+ "epoch": 2.62,
924
+ "eval_ACT": {
925
+ "f1": 0.9370229007633587,
926
+ "number": 519,
927
+ "precision": 0.9281663516068053,
928
+ "recall": 0.9460500963391136
929
+ },
930
+ "eval_ACT_L1": {
931
+ "f1": 0.9640718562874252,
932
+ "number": 503,
933
+ "precision": 0.9679358717434869,
934
+ "recall": 0.9602385685884692
935
+ },
936
+ "eval_ACT_L2": {
937
+ "f1": 0.3478260869565218,
938
+ "number": 16,
939
+ "precision": 0.26666666666666666,
940
+ "recall": 0.5
941
+ },
942
+ "eval_CARDINAL": {
943
+ "f1": 0.9933774834437086,
944
+ "number": 678,
945
+ "precision": 0.9911894273127754,
946
+ "recall": 0.995575221238938
947
+ },
948
+ "eval_DESC": {
949
+ "f1": 0.5063291139240507,
950
+ "number": 30,
951
+ "precision": 0.40816326530612246,
952
+ "recall": 0.6666666666666666
953
+ },
954
+ "eval_FT": {
955
+ "f1": 0.0,
956
+ "number": 7,
957
+ "precision": 0.0,
958
+ "recall": 0.0
959
+ },
960
+ "eval_LOC": {
961
+ "f1": 0.9711286089238845,
962
+ "number": 761,
963
+ "precision": 0.9698558322411533,
964
+ "recall": 0.9724047306176085
965
+ },
966
+ "eval_PER": {
967
+ "f1": 0.9867060561299853,
968
+ "number": 676,
969
+ "precision": 0.9852507374631269,
970
+ "recall": 0.9881656804733728
971
+ },
972
+ "eval_SPAT": {
973
+ "f1": 0.9676956209619526,
974
+ "number": 694,
975
+ "precision": 0.9642346208869814,
976
+ "recall": 0.9711815561959655
977
+ },
978
+ "eval_TITRE": {
979
+ "f1": 0.0,
980
+ "number": 2,
981
+ "precision": 0.0,
982
+ "recall": 0.0
983
+ },
984
+ "eval_TITREH": {
985
+ "f1": 0.9142857142857143,
986
+ "number": 33,
987
+ "precision": 0.8648648648648649,
988
+ "recall": 0.9696969696969697
989
+ },
990
+ "eval_TITREP": {
991
+ "f1": 0.4000000000000001,
992
+ "number": 5,
993
+ "precision": 0.4,
994
+ "recall": 0.4
995
+ },
996
+ "eval_accuracy": 0.9533267130089375,
997
+ "eval_accuracy-all": 0.9641881827209533,
998
+ "eval_accuracy-das": 0.9762909632571996,
999
+ "eval_accuracy-l1": 0.958291956305859,
1000
+ "eval_accuracy-l2": 0.9700844091360477,
1001
+ "eval_f1": 0.9668492360910925,
1002
+ "eval_f1-all": 0.9646508910312591,
1003
+ "eval_f1-das": 0.972470238095238,
1004
+ "eval_f1-l1": 0.9634464751958223,
1005
+ "eval_f1-l2": 0.9661803713527852,
1006
+ "eval_loss": 0.1481187343597412,
1007
+ "eval_precision": 0.9624103299856528,
1008
+ "eval_precision-all": 0.959604766056379,
1009
+ "eval_precision-das": 0.9710252600297177,
1010
+ "eval_precision-l1": 0.9584415584415584,
1011
+ "eval_precision-l2": 0.9610817941952506,
1012
+ "eval_recall": 0.9713292788879235,
1013
+ "eval_recall-all": 0.9697503671071953,
1014
+ "eval_recall-das": 0.973919523099851,
1015
+ "eval_recall-l1": 0.968503937007874,
1016
+ "eval_recall-l2": 0.9713333333333334,
1017
+ "eval_runtime": 20.9824,
1018
+ "eval_samples_per_second": 32.217,
1019
+ "eval_steps_per_second": 2.049,
1020
+ "step": 1000
1021
+ },
1022
+ {
1023
+ "epoch": 2.89,
1024
+ "eval_ACT": {
1025
+ "f1": 0.9523809523809523,
1026
+ "number": 519,
1027
+ "precision": 0.9416195856873822,
1028
+ "recall": 0.9633911368015414
1029
+ },
1030
+ "eval_ACT_L1": {
1031
+ "f1": 0.9713721618953604,
1032
+ "number": 503,
1033
+ "precision": 0.9647058823529412,
1034
+ "recall": 0.9781312127236581
1035
+ },
1036
+ "eval_ACT_L2": {
1037
+ "f1": 0.4324324324324324,
1038
+ "number": 16,
1039
+ "precision": 0.38095238095238093,
1040
+ "recall": 0.5
1041
+ },
1042
+ "eval_CARDINAL": {
1043
+ "f1": 0.9911373707533235,
1044
+ "number": 678,
1045
+ "precision": 0.992603550295858,
1046
+ "recall": 0.9896755162241888
1047
+ },
1048
+ "eval_DESC": {
1049
+ "f1": 0.4864864864864865,
1050
+ "number": 30,
1051
+ "precision": 0.4090909090909091,
1052
+ "recall": 0.6
1053
+ },
1054
+ "eval_FT": {
1055
+ "f1": 0.22222222222222224,
1056
+ "number": 7,
1057
+ "precision": 0.5,
1058
+ "recall": 0.14285714285714285
1059
+ },
1060
+ "eval_LOC": {
1061
+ "f1": 0.9648437500000001,
1062
+ "number": 761,
1063
+ "precision": 0.9561290322580646,
1064
+ "recall": 0.973718791064389
1065
+ },
1066
+ "eval_PER": {
1067
+ "f1": 0.9874353288987435,
1068
+ "number": 676,
1069
+ "precision": 0.9867060561299852,
1070
+ "recall": 0.9881656804733728
1071
+ },
1072
+ "eval_SPAT": {
1073
+ "f1": 0.966113914924297,
1074
+ "number": 694,
1075
+ "precision": 0.9668109668109668,
1076
+ "recall": 0.9654178674351584
1077
+ },
1078
+ "eval_TITRE": {
1079
+ "f1": 0.0,
1080
+ "number": 2,
1081
+ "precision": 0.0,
1082
+ "recall": 0.0
1083
+ },
1084
+ "eval_TITREH": {
1085
+ "f1": 0.9253731343283583,
1086
+ "number": 33,
1087
+ "precision": 0.9117647058823529,
1088
+ "recall": 0.9393939393939394
1089
+ },
1090
+ "eval_TITREP": {
1091
+ "f1": 0.5333333333333333,
1092
+ "number": 5,
1093
+ "precision": 0.4,
1094
+ "recall": 0.8
1095
+ },
1096
+ "eval_accuracy": 0.9617676266137041,
1097
+ "eval_accuracy-all": 0.9718843098311817,
1098
+ "eval_accuracy-das": 0.9786494538232373,
1099
+ "eval_accuracy-l1": 0.9664846077457795,
1100
+ "eval_accuracy-l2": 0.9772840119165839,
1101
+ "eval_f1": 0.9666474985623923,
1102
+ "eval_f1-all": 0.9650942018402219,
1103
+ "eval_f1-das": 0.9727222119131563,
1104
+ "eval_f1-l1": 0.9652650822669104,
1105
+ "eval_f1-l2": 0.9648774022531478,
1106
+ "eval_loss": 0.13178446888923645,
1107
+ "eval_precision": 0.9597487867542107,
1108
+ "eval_precision-all": 0.9599070307960488,
1109
+ "eval_precision-das": 0.9689463955637708,
1110
+ "eval_precision-l1": 0.9604989604989606,
1111
+ "eval_precision-l2": 0.9591567852437418,
1112
+ "eval_recall": 0.9736461048363741,
1113
+ "eval_recall-all": 0.970337738619677,
1114
+ "eval_recall-das": 0.9765275707898659,
1115
+ "eval_recall-l1": 0.9700787401574803,
1116
+ "eval_recall-l2": 0.9706666666666667,
1117
+ "eval_runtime": 21.6072,
1118
+ "eval_samples_per_second": 31.286,
1119
+ "eval_steps_per_second": 1.99,
1120
+ "step": 1100
1121
+ },
1122
+ {
1123
+ "epoch": 3.15,
1124
+ "eval_ACT": {
1125
+ "f1": 0.9504761904761905,
1126
+ "number": 519,
1127
+ "precision": 0.9397363465160076,
1128
+ "recall": 0.9614643545279383
1129
+ },
1130
+ "eval_ACT_L1": {
1131
+ "f1": 0.971201588877855,
1132
+ "number": 503,
1133
+ "precision": 0.9702380952380952,
1134
+ "recall": 0.9721669980119284
1135
+ },
1136
+ "eval_ACT_L2": {
1137
+ "f1": 0.4651162790697674,
1138
+ "number": 16,
1139
+ "precision": 0.37037037037037035,
1140
+ "recall": 0.625
1141
+ },
1142
+ "eval_CARDINAL": {
1143
+ "f1": 0.9926253687315634,
1144
+ "number": 678,
1145
+ "precision": 0.9926253687315634,
1146
+ "recall": 0.9926253687315634
1147
+ },
1148
+ "eval_DESC": {
1149
+ "f1": 0.5263157894736841,
1150
+ "number": 30,
1151
+ "precision": 0.43478260869565216,
1152
+ "recall": 0.6666666666666666
1153
+ },
1154
+ "eval_FT": {
1155
+ "f1": 0.25,
1156
+ "number": 7,
1157
+ "precision": 1.0,
1158
+ "recall": 0.14285714285714285
1159
+ },
1160
+ "eval_LOC": {
1161
+ "f1": 0.9691803278688523,
1162
+ "number": 761,
1163
+ "precision": 0.9672774869109948,
1164
+ "recall": 0.9710906701708278
1165
+ },
1166
+ "eval_PER": {
1167
+ "f1": 0.9852289512555391,
1168
+ "number": 676,
1169
+ "precision": 0.9837758112094396,
1170
+ "recall": 0.9866863905325444
1171
+ },
1172
+ "eval_SPAT": {
1173
+ "f1": 0.9595959595959597,
1174
+ "number": 694,
1175
+ "precision": 0.9609826589595376,
1176
+ "recall": 0.9582132564841499
1177
+ },
1178
+ "eval_TITRE": {
1179
+ "f1": 0.0,
1180
+ "number": 2,
1181
+ "precision": 0.0,
1182
+ "recall": 0.0
1183
+ },
1184
+ "eval_TITREH": {
1185
+ "f1": 0.8985507246376813,
1186
+ "number": 33,
1187
+ "precision": 0.8611111111111112,
1188
+ "recall": 0.9393939393939394
1189
+ },
1190
+ "eval_TITREP": {
1191
+ "f1": 0.4444444444444445,
1192
+ "number": 5,
1193
+ "precision": 0.5,
1194
+ "recall": 0.4
1195
+ },
1196
+ "eval_accuracy": 0.9602780536246276,
1197
+ "eval_accuracy-all": 0.9703326713008937,
1198
+ "eval_accuracy-das": 0.9793942403177756,
1199
+ "eval_accuracy-l1": 0.9651191658391262,
1200
+ "eval_accuracy-l2": 0.9755461767626614,
1201
+ "eval_f1": 0.9684392563769997,
1202
+ "eval_f1-all": 0.9647403072421361,
1203
+ "eval_f1-das": 0.9741395348837208,
1204
+ "eval_f1-l1": 0.9626143790849672,
1205
+ "eval_f1-l2": 0.9674418604651163,
1206
+ "eval_loss": 0.13072313368320465,
1207
+ "eval_precision": 0.963855421686747,
1208
+ "eval_precision-all": 0.9612244897959183,
1209
+ "eval_precision-das": 0.9728725380899294,
1210
+ "eval_precision-l1": 0.9588541666666667,
1211
+ "eval_precision-l2": 0.9642384105960264,
1212
+ "eval_recall": 0.9730668983492615,
1213
+ "eval_recall-all": 0.9682819383259912,
1214
+ "eval_recall-das": 0.9754098360655737,
1215
+ "eval_recall-l1": 0.9664041994750656,
1216
+ "eval_recall-l2": 0.9706666666666667,
1217
+ "eval_runtime": 7.9998,
1218
+ "eval_samples_per_second": 84.502,
1219
+ "eval_steps_per_second": 5.375,
1220
+ "step": 1200
1221
+ }
1222
+ ],
1223
+ "max_steps": 5000,
1224
+ "num_train_epochs": 14,
1225
+ "total_flos": 486860284369728.0,
1226
+ "trial_name": null,
1227
+ "trial_params": null
1228
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6caeb662d58aa9758d6024aa2304c5de8a6dd56a58ec7068fe5cf615acb1dff7
3
+ size 3503