nlpso commited on
Commit
2eec7bc
1 Parent(s): fe7c1e6

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "HueyNemud/das22-10-camembert_pretrained",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-b_PER+O",
17
+ "2": "I-i_PER+O",
18
+ "3": "I-b_PER+b_TITREH",
19
+ "4": "I-i_PER+b_TITREH",
20
+ "5": "I-i_PER+i_TITREH",
21
+ "6": "I-b_ACT+O",
22
+ "7": "I-i_ACT+O",
23
+ "8": "I-b_DESC+O",
24
+ "9": "I-i_DESC+O",
25
+ "10": "I-b_DESC+b_ACT",
26
+ "11": "I-i_DESC+b_ACT",
27
+ "12": "I-i_DESC+i_ACT",
28
+ "13": "I-b_DESC+b_TITREP",
29
+ "14": "I-i_DESC+b_TITREP",
30
+ "15": "I-i_DESC+i_TITREP",
31
+ "16": "I-b_SPAT+O",
32
+ "17": "I-i_SPAT+O",
33
+ "18": "I-b_SPAT+b_LOC",
34
+ "19": "I-i_SPAT+b_LOC",
35
+ "20": "I-i_SPAT+i_LOC",
36
+ "21": "I-b_SPAT+b_CARDINAL",
37
+ "22": "I-i_SPAT+b_CARDINAL",
38
+ "23": "I-i_SPAT+i_CARDINAL",
39
+ "24": "I-b_SPAT+b_FT",
40
+ "25": "I-i_SPAT+b_FT",
41
+ "26": "I-i_SPAT+i_FT",
42
+ "27": "I-b_TITRE+O",
43
+ "28": "I-i_TITRE+O"
44
+ },
45
+ "initializer_range": 0.02,
46
+ "intermediate_size": 3072,
47
+ "label2id": {
48
+ "I-b_ACT+O": 6,
49
+ "I-b_DESC+O": 8,
50
+ "I-b_DESC+b_ACT": 10,
51
+ "I-b_DESC+b_TITREP": 13,
52
+ "I-b_PER+O": 1,
53
+ "I-b_PER+b_TITREH": 3,
54
+ "I-b_SPAT+O": 16,
55
+ "I-b_SPAT+b_CARDINAL": 21,
56
+ "I-b_SPAT+b_FT": 24,
57
+ "I-b_SPAT+b_LOC": 18,
58
+ "I-b_TITRE+O": 27,
59
+ "I-i_ACT+O": 7,
60
+ "I-i_DESC+O": 9,
61
+ "I-i_DESC+b_ACT": 11,
62
+ "I-i_DESC+b_TITREP": 14,
63
+ "I-i_DESC+i_ACT": 12,
64
+ "I-i_DESC+i_TITREP": 15,
65
+ "I-i_PER+O": 2,
66
+ "I-i_PER+b_TITREH": 4,
67
+ "I-i_PER+i_TITREH": 5,
68
+ "I-i_SPAT+O": 17,
69
+ "I-i_SPAT+b_CARDINAL": 22,
70
+ "I-i_SPAT+b_FT": 25,
71
+ "I-i_SPAT+b_LOC": 19,
72
+ "I-i_SPAT+i_CARDINAL": 23,
73
+ "I-i_SPAT+i_FT": 26,
74
+ "I-i_SPAT+i_LOC": 20,
75
+ "I-i_TITRE+O": 28,
76
+ "O+O": 0
77
+ },
78
+ "layer_norm_eps": 1e-05,
79
+ "max_position_embeddings": 514,
80
+ "model_type": "camembert",
81
+ "num_attention_heads": 12,
82
+ "num_hidden_layers": 12,
83
+ "output_past": true,
84
+ "pad_token_id": 1,
85
+ "position_embedding_type": "absolute",
86
+ "torch_dtype": "float32",
87
+ "transformers_version": "4.25.1",
88
+ "type_vocab_size": 1,
89
+ "use_cache": true,
90
+ "vocab_size": 32005
91
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9db1f8ba0c8e27a51f2c4c8112ed5e71eb5d817bd45575f3c7d73cff702cfb3b
3
+ size 880544613
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98b2dcd2c1f57b79c5e5c495c7f0f3d12b1bb5933142597cfaf539be8312521f
3
+ size 440285681
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e172e9e6fdfd5d0cd07e1476cba228f9ae54616ac2e5a17d6b394ef1963283
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3348d57e33a2df56ff570fa06068a10b38e92e5d9370fb65ef4dc6aceb702906
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "HueyNemud/das22-10-camembert_pretrained",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/jchazalo/.cache/huggingface/transformers/fe0e213c44079a9ee091098f81fff2941484006e9ba3001a9bf1ee9f87537599.cb3ec3a6c1200d181228d8825ae9767572abca54efa1bbb37fd83d721b2ef323",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,1484 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9732283464566929,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/314-pretrained-camembert-ner-hierarchical-loss-iob2/checkpoint-1400",
4
+ "epoch": 3.674540682414698,
5
+ "global_step": 1400,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8992673992673993,
14
+ "number": 519,
15
+ "precision": 0.8568935427574171,
16
+ "recall": 0.9460500963391136
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.912639405204461,
20
+ "number": 503,
21
+ "precision": 0.8568935427574171,
22
+ "recall": 0.9761431411530815
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9816041206769685,
32
+ "number": 678,
33
+ "precision": 0.9794419970631424,
34
+ "recall": 0.9837758112094396
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9583333333333334,
50
+ "number": 762,
51
+ "precision": 0.9509043927648578,
52
+ "recall": 0.9658792650918635
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9560117302052786,
56
+ "number": 676,
57
+ "precision": 0.9476744186046512,
58
+ "recall": 0.9644970414201184
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.9562724014336917,
62
+ "number": 694,
63
+ "precision": 0.9514978601997147,
64
+ "recall": 0.9610951008645533
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.9404170804369414,
85
+ "eval_accuracy-all": 0.9610228401191658,
86
+ "eval_accuracy-das": 0.9565541211519365,
87
+ "eval_accuracy-l1": 0.9500993048659384,
88
+ "eval_accuracy-l1l2": 0.9407894736842105,
89
+ "eval_accuracy-l2": 0.9719463753723933,
90
+ "eval_f1": 0.9438787055894999,
91
+ "eval_f1-all": 0.9416764361078547,
92
+ "eval_f1-das": 0.9402153731897512,
93
+ "eval_f1-l1": 0.9361261960175847,
94
+ "eval_f1-l1l2": 0.9384570933256284,
95
+ "eval_f1-l2": 0.9489347311464321,
96
+ "eval_loss": 0.6206728219985962,
97
+ "eval_precision": 0.9473086531910061,
98
+ "eval_precision-all": 0.9402985074626866,
99
+ "eval_precision-das": 0.9370836417468542,
100
+ "eval_precision-l1": 0.9225280326197758,
101
+ "eval_precision-l1l2": 0.9368329968272282,
102
+ "eval_precision-l2": 0.9642611683848797,
103
+ "eval_recall": 0.9404735062006765,
104
+ "eval_recall-all": 0.9430584091576166,
105
+ "eval_recall-das": 0.9433681073025335,
106
+ "eval_recall-l1": 0.9501312335958005,
107
+ "eval_recall-l1l2": 0.9400868306801736,
108
+ "eval_recall-l2": 0.9340878828229028,
109
+ "eval_runtime": 7.1724,
110
+ "eval_samples_per_second": 94.251,
111
+ "eval_steps_per_second": 5.995,
112
+ "step": 100
113
+ },
114
+ {
115
+ "epoch": 0.52,
116
+ "eval_ACT": {
117
+ "f1": 0.9291784702549574,
118
+ "number": 519,
119
+ "precision": 0.9111111111111111,
120
+ "recall": 0.9479768786127167
121
+ },
122
+ "eval_ACT_L1": {
123
+ "f1": 0.9434324065196549,
124
+ "number": 503,
125
+ "precision": 0.9111111111111111,
126
+ "recall": 0.9781312127236581
127
+ },
128
+ "eval_ACT_L2": {
129
+ "f1": 0.0,
130
+ "number": 16,
131
+ "precision": 0.0,
132
+ "recall": 0.0
133
+ },
134
+ "eval_CARDINAL": {
135
+ "f1": 0.9919058130978661,
136
+ "number": 678,
137
+ "precision": 0.9897209985315712,
138
+ "recall": 0.9941002949852508
139
+ },
140
+ "eval_DESC": {
141
+ "f1": 0.3103448275862069,
142
+ "number": 30,
143
+ "precision": 0.32142857142857145,
144
+ "recall": 0.3
145
+ },
146
+ "eval_FT": {
147
+ "f1": 0.0,
148
+ "number": 7,
149
+ "precision": 0.0,
150
+ "recall": 0.0
151
+ },
152
+ "eval_LOC": {
153
+ "f1": 0.9521345407503234,
154
+ "number": 762,
155
+ "precision": 0.9387755102040817,
156
+ "recall": 0.9658792650918635
157
+ },
158
+ "eval_PER": {
159
+ "f1": 0.983050847457627,
160
+ "number": 676,
161
+ "precision": 0.9794419970631424,
162
+ "recall": 0.9866863905325444
163
+ },
164
+ "eval_SPAT": {
165
+ "f1": 0.9542857142857143,
166
+ "number": 694,
167
+ "precision": 0.9461756373937678,
168
+ "recall": 0.962536023054755
169
+ },
170
+ "eval_TITRE": {
171
+ "f1": 0.0,
172
+ "number": 2,
173
+ "precision": 0.0,
174
+ "recall": 0.0
175
+ },
176
+ "eval_TITREH": {
177
+ "f1": 0.43373493975903615,
178
+ "number": 33,
179
+ "precision": 0.36,
180
+ "recall": 0.5454545454545454
181
+ },
182
+ "eval_TITREP": {
183
+ "f1": 0.0,
184
+ "number": 6,
185
+ "precision": 0.0,
186
+ "recall": 0.0
187
+ },
188
+ "eval_accuracy": 0.951837140019861,
189
+ "eval_accuracy-all": 0.9676017874875869,
190
+ "eval_accuracy-das": 0.9716981132075472,
191
+ "eval_accuracy-l1": 0.9602780536246276,
192
+ "eval_accuracy-l1l2": 0.9524577954319762,
193
+ "eval_accuracy-l2": 0.9749255213505462,
194
+ "eval_f1": 0.9533235856484086,
195
+ "eval_f1-all": 0.9492511269448888,
196
+ "eval_f1-das": 0.9659385412810071,
197
+ "eval_f1-l1": 0.9512953367875648,
198
+ "eval_f1-l1l2": 0.9528720813637014,
199
+ "eval_f1-l2": 0.9466357308584686,
200
+ "eval_loss": 0.3473620116710663,
201
+ "eval_precision": 0.9510771992818672,
202
+ "eval_precision-all": 0.9406340057636887,
203
+ "eval_precision-das": 0.9598969830757911,
204
+ "eval_precision-l1": 0.9391304347826087,
205
+ "eval_precision-l1l2": 0.9432785025524674,
206
+ "eval_precision-l2": 0.9425742574257425,
207
+ "eval_recall": 0.9555806087936866,
208
+ "eval_recall-all": 0.9580275902553567,
209
+ "eval_recall-das": 0.9720566318926974,
210
+ "eval_recall-l1": 0.9637795275590552,
211
+ "eval_recall-l1l2": 0.9626628075253256,
212
+ "eval_recall-l2": 0.9507323568575233,
213
+ "eval_runtime": 7.1425,
214
+ "eval_samples_per_second": 94.645,
215
+ "eval_steps_per_second": 6.02,
216
+ "step": 200
217
+ },
218
+ {
219
+ "epoch": 0.79,
220
+ "eval_ACT": {
221
+ "f1": 0.9467680608365019,
222
+ "number": 519,
223
+ "precision": 0.9343339587242027,
224
+ "recall": 0.9595375722543352
225
+ },
226
+ "eval_ACT_L1": {
227
+ "f1": 0.9613899613899614,
228
+ "number": 503,
229
+ "precision": 0.9343339587242027,
230
+ "recall": 0.9900596421471173
231
+ },
232
+ "eval_ACT_L2": {
233
+ "f1": 0.0,
234
+ "number": 16,
235
+ "precision": 0.0,
236
+ "recall": 0.0
237
+ },
238
+ "eval_CARDINAL": {
239
+ "f1": 0.9933774834437086,
240
+ "number": 678,
241
+ "precision": 0.9911894273127754,
242
+ "recall": 0.995575221238938
243
+ },
244
+ "eval_DESC": {
245
+ "f1": 0.22580645161290322,
246
+ "number": 30,
247
+ "precision": 0.21875,
248
+ "recall": 0.23333333333333334
249
+ },
250
+ "eval_FT": {
251
+ "f1": 0.0,
252
+ "number": 7,
253
+ "precision": 0.0,
254
+ "recall": 0.0
255
+ },
256
+ "eval_LOC": {
257
+ "f1": 0.9609882964889467,
258
+ "number": 762,
259
+ "precision": 0.9523195876288659,
260
+ "recall": 0.9698162729658792
261
+ },
262
+ "eval_PER": {
263
+ "f1": 0.9808541973490428,
264
+ "number": 676,
265
+ "precision": 0.9765395894428153,
266
+ "recall": 0.985207100591716
267
+ },
268
+ "eval_SPAT": {
269
+ "f1": 0.9700000000000001,
270
+ "number": 694,
271
+ "precision": 0.9617563739376771,
272
+ "recall": 0.978386167146974
273
+ },
274
+ "eval_TITRE": {
275
+ "f1": 0.0,
276
+ "number": 2,
277
+ "precision": 0.0,
278
+ "recall": 0.0
279
+ },
280
+ "eval_TITREH": {
281
+ "f1": 0.6756756756756757,
282
+ "number": 33,
283
+ "precision": 0.6097560975609756,
284
+ "recall": 0.7575757575757576
285
+ },
286
+ "eval_TITREP": {
287
+ "f1": 0.6,
288
+ "number": 6,
289
+ "precision": 0.75,
290
+ "recall": 0.5
291
+ },
292
+ "eval_accuracy": 0.9551886792452831,
293
+ "eval_accuracy-all": 0.9682845084409136,
294
+ "eval_accuracy-das": 0.9759185700099305,
295
+ "eval_accuracy-l1": 0.9617676266137041,
296
+ "eval_accuracy-l1l2": 0.9554369414101291,
297
+ "eval_accuracy-l2": 0.9748013902681232,
298
+ "eval_f1": 0.9625788999098286,
299
+ "eval_f1-all": 0.9594870300204023,
300
+ "eval_f1-das": 0.9718100890207715,
301
+ "eval_f1-l1": 0.9590461378952824,
302
+ "eval_f1-l1l2": 0.9622695852534562,
303
+ "eval_f1-l2": 0.9600532623169108,
304
+ "eval_loss": 0.24261289834976196,
305
+ "eval_precision": 0.9623619562767636,
306
+ "eval_precision-all": 0.952821997105644,
307
+ "eval_precision-das": 0.9675036927621861,
308
+ "eval_precision-l1": 0.9472606246799795,
309
+ "eval_precision-l1l2": 0.9575809687589567,
310
+ "eval_precision-l2": 0.9600532623169108,
311
+ "eval_recall": 0.9627959413754228,
312
+ "eval_recall-all": 0.9662459641913707,
313
+ "eval_recall-das": 0.9761549925484352,
314
+ "eval_recall-l1": 0.9711286089238845,
315
+ "eval_recall-l1l2": 0.9670043415340087,
316
+ "eval_recall-l2": 0.9600532623169108,
317
+ "eval_runtime": 8.0913,
318
+ "eval_samples_per_second": 83.547,
319
+ "eval_steps_per_second": 5.314,
320
+ "step": 300
321
+ },
322
+ {
323
+ "epoch": 1.05,
324
+ "eval_ACT": {
325
+ "f1": 0.9337121212121212,
326
+ "number": 519,
327
+ "precision": 0.9180633147113594,
328
+ "recall": 0.9499036608863198
329
+ },
330
+ "eval_ACT_L1": {
331
+ "f1": 0.9480769230769232,
332
+ "number": 503,
333
+ "precision": 0.9180633147113594,
334
+ "recall": 0.9801192842942346
335
+ },
336
+ "eval_ACT_L2": {
337
+ "f1": 0.0,
338
+ "number": 16,
339
+ "precision": 0.0,
340
+ "recall": 0.0
341
+ },
342
+ "eval_CARDINAL": {
343
+ "f1": 0.9933774834437086,
344
+ "number": 678,
345
+ "precision": 0.9911894273127754,
346
+ "recall": 0.995575221238938
347
+ },
348
+ "eval_DESC": {
349
+ "f1": 0.21951219512195122,
350
+ "number": 30,
351
+ "precision": 0.17307692307692307,
352
+ "recall": 0.3
353
+ },
354
+ "eval_FT": {
355
+ "f1": 0.2,
356
+ "number": 7,
357
+ "precision": 0.3333333333333333,
358
+ "recall": 0.14285714285714285
359
+ },
360
+ "eval_LOC": {
361
+ "f1": 0.9583875162548764,
362
+ "number": 762,
363
+ "precision": 0.9497422680412371,
364
+ "recall": 0.9671916010498688
365
+ },
366
+ "eval_PER": {
367
+ "f1": 0.9889298892988929,
368
+ "number": 676,
369
+ "precision": 0.9867452135493373,
370
+ "recall": 0.9911242603550295
371
+ },
372
+ "eval_SPAT": {
373
+ "f1": 0.964924838940587,
374
+ "number": 694,
375
+ "precision": 0.9587482219061166,
376
+ "recall": 0.9711815561959655
377
+ },
378
+ "eval_TITRE": {
379
+ "f1": 0.0,
380
+ "number": 2,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_TITREH": {
385
+ "f1": 0.9117647058823529,
386
+ "number": 33,
387
+ "precision": 0.8857142857142857,
388
+ "recall": 0.9393939393939394
389
+ },
390
+ "eval_TITREP": {
391
+ "f1": 0.6153846153846153,
392
+ "number": 6,
393
+ "precision": 0.5714285714285714,
394
+ "recall": 0.6666666666666666
395
+ },
396
+ "eval_accuracy": 0.961395233366435,
397
+ "eval_accuracy-all": 0.9726911618669315,
398
+ "eval_accuracy-das": 0.9774081429990069,
399
+ "eval_accuracy-l1": 0.9667328699106256,
400
+ "eval_accuracy-l1l2": 0.9620158887785502,
401
+ "eval_accuracy-l2": 0.9786494538232373,
402
+ "eval_f1": 0.9638120926050797,
403
+ "eval_f1-all": 0.9575581395348837,
404
+ "eval_f1-das": 0.9719799591760996,
405
+ "eval_f1-l1": 0.9525283797729618,
406
+ "eval_f1-l1l2": 0.962516156828953,
407
+ "eval_f1-l2": 0.9640479360852197,
408
+ "eval_loss": 0.1985810250043869,
409
+ "eval_precision": 0.9607887071476585,
410
+ "eval_precision-all": 0.9484595450619061,
411
+ "eval_precision-das": 0.9682070240295748,
412
+ "eval_precision-l1": 0.9365804160324708,
413
+ "eval_precision-l1l2": 0.9552451539338654,
414
+ "eval_precision-l2": 0.9640479360852197,
415
+ "eval_recall": 0.9668545659526494,
416
+ "eval_recall-all": 0.966832990901086,
417
+ "eval_recall-das": 0.9757824143070045,
418
+ "eval_recall-l1": 0.9690288713910761,
419
+ "eval_recall-l1l2": 0.9698986975397974,
420
+ "eval_recall-l2": 0.9640479360852197,
421
+ "eval_runtime": 6.8598,
422
+ "eval_samples_per_second": 98.545,
423
+ "eval_steps_per_second": 6.268,
424
+ "step": 400
425
+ },
426
+ {
427
+ "epoch": 1.31,
428
+ "learning_rate": 9e-05,
429
+ "loss": 0.5596,
430
+ "step": 500
431
+ },
432
+ {
433
+ "epoch": 1.31,
434
+ "eval_ACT": {
435
+ "f1": 0.9334600760456274,
436
+ "number": 519,
437
+ "precision": 0.9212007504690432,
438
+ "recall": 0.9460500963391136
439
+ },
440
+ "eval_ACT_L1": {
441
+ "f1": 0.948792270531401,
442
+ "number": 503,
443
+ "precision": 0.9229323308270677,
444
+ "recall": 0.9761431411530815
445
+ },
446
+ "eval_ACT_L2": {
447
+ "f1": 0.0,
448
+ "number": 16,
449
+ "precision": 0.0,
450
+ "recall": 0.0
451
+ },
452
+ "eval_CARDINAL": {
453
+ "f1": 0.9933774834437086,
454
+ "number": 678,
455
+ "precision": 0.9911894273127754,
456
+ "recall": 0.995575221238938
457
+ },
458
+ "eval_DESC": {
459
+ "f1": 0.2758620689655172,
460
+ "number": 30,
461
+ "precision": 0.2857142857142857,
462
+ "recall": 0.26666666666666666
463
+ },
464
+ "eval_FT": {
465
+ "f1": 0.36363636363636365,
466
+ "number": 7,
467
+ "precision": 0.5,
468
+ "recall": 0.2857142857142857
469
+ },
470
+ "eval_LOC": {
471
+ "f1": 0.9538661468486029,
472
+ "number": 762,
473
+ "precision": 0.9446589446589446,
474
+ "recall": 0.963254593175853
475
+ },
476
+ "eval_PER": {
477
+ "f1": 0.9734904270986746,
478
+ "number": 676,
479
+ "precision": 0.969208211143695,
480
+ "recall": 0.977810650887574
481
+ },
482
+ "eval_SPAT": {
483
+ "f1": 0.9549678341672624,
484
+ "number": 694,
485
+ "precision": 0.9475177304964539,
486
+ "recall": 0.962536023054755
487
+ },
488
+ "eval_TITRE": {
489
+ "f1": 0.0,
490
+ "number": 2,
491
+ "precision": 0.0,
492
+ "recall": 0.0
493
+ },
494
+ "eval_TITREH": {
495
+ "f1": 0.8571428571428571,
496
+ "number": 33,
497
+ "precision": 0.8108108108108109,
498
+ "recall": 0.9090909090909091
499
+ },
500
+ "eval_TITREP": {
501
+ "f1": 0.4615384615384615,
502
+ "number": 6,
503
+ "precision": 0.42857142857142855,
504
+ "recall": 0.5
505
+ },
506
+ "eval_accuracy": 0.961643495531281,
507
+ "eval_accuracy-all": 0.9728152929493545,
508
+ "eval_accuracy-das": 0.9765392254220456,
509
+ "eval_accuracy-l1": 0.9676017874875869,
510
+ "eval_accuracy-l1l2": 0.9621400198609732,
511
+ "eval_accuracy-l2": 0.9780287984111221,
512
+ "eval_f1": 0.9624465932089048,
513
+ "eval_f1-all": 0.9537968226206093,
514
+ "eval_f1-das": 0.9642393922549565,
515
+ "eval_f1-l1": 0.949117341640706,
516
+ "eval_f1-l1l2": 0.958699093394733,
517
+ "eval_f1-l2": 0.9597873047524094,
518
+ "eval_loss": 0.18591071665287018,
519
+ "eval_precision": 0.9598564700605517,
520
+ "eval_precision-all": 0.9473074696004632,
521
+ "eval_precision-das": 0.9590858827865831,
522
+ "eval_precision-l1": 0.9388803287108372,
523
+ "eval_precision-l1l2": 0.9533485975958786,
524
+ "eval_precision-l2": 0.9581950895819509,
525
+ "eval_recall": 0.9650507328072153,
526
+ "eval_recall-all": 0.9603756970942178,
527
+ "eval_recall-das": 0.9694485842026825,
528
+ "eval_recall-l1": 0.9595800524934384,
529
+ "eval_recall-l1l2": 0.96410998552822,
530
+ "eval_recall-l2": 0.9613848202396804,
531
+ "eval_runtime": 7.193,
532
+ "eval_samples_per_second": 93.98,
533
+ "eval_steps_per_second": 5.978,
534
+ "step": 500
535
+ },
536
+ {
537
+ "epoch": 1.57,
538
+ "eval_ACT": {
539
+ "f1": 0.9419600380589914,
540
+ "number": 519,
541
+ "precision": 0.9304511278195489,
542
+ "recall": 0.953757225433526
543
+ },
544
+ "eval_ACT_L1": {
545
+ "f1": 0.9573643410852714,
546
+ "number": 503,
547
+ "precision": 0.9338374291115312,
548
+ "recall": 0.9821073558648111
549
+ },
550
+ "eval_ACT_L2": {
551
+ "f1": 0.10526315789473684,
552
+ "number": 16,
553
+ "precision": 0.3333333333333333,
554
+ "recall": 0.0625
555
+ },
556
+ "eval_CARDINAL": {
557
+ "f1": 0.9933774834437086,
558
+ "number": 678,
559
+ "precision": 0.9911894273127754,
560
+ "recall": 0.995575221238938
561
+ },
562
+ "eval_DESC": {
563
+ "f1": 0.30985915492957744,
564
+ "number": 30,
565
+ "precision": 0.2682926829268293,
566
+ "recall": 0.36666666666666664
567
+ },
568
+ "eval_FT": {
569
+ "f1": 0.30769230769230765,
570
+ "number": 7,
571
+ "precision": 0.3333333333333333,
572
+ "recall": 0.2857142857142857
573
+ },
574
+ "eval_LOC": {
575
+ "f1": 0.9487345879299156,
576
+ "number": 762,
577
+ "precision": 0.938382541720154,
578
+ "recall": 0.9593175853018373
579
+ },
580
+ "eval_PER": {
581
+ "f1": 0.9823008849557522,
582
+ "number": 676,
583
+ "precision": 0.9794117647058823,
584
+ "recall": 0.985207100591716
585
+ },
586
+ "eval_SPAT": {
587
+ "f1": 0.9590222861250898,
588
+ "number": 694,
589
+ "precision": 0.9569583931133429,
590
+ "recall": 0.9610951008645533
591
+ },
592
+ "eval_TITRE": {
593
+ "f1": 0.0,
594
+ "number": 2,
595
+ "precision": 0.0,
596
+ "recall": 0.0
597
+ },
598
+ "eval_TITREH": {
599
+ "f1": 0.9117647058823529,
600
+ "number": 33,
601
+ "precision": 0.8857142857142857,
602
+ "recall": 0.9393939393939394
603
+ },
604
+ "eval_TITREP": {
605
+ "f1": 0.5714285714285715,
606
+ "number": 6,
607
+ "precision": 0.5,
608
+ "recall": 0.6666666666666666
609
+ },
610
+ "eval_accuracy": 0.9654915590863953,
611
+ "eval_accuracy-all": 0.9756703078450845,
612
+ "eval_accuracy-das": 0.9801390268123138,
613
+ "eval_accuracy-l1": 0.9725670307845085,
614
+ "eval_accuracy-l1l2": 0.9663604766633564,
615
+ "eval_accuracy-l2": 0.9787735849056604,
616
+ "eval_f1": 0.9630793401413982,
617
+ "eval_f1-all": 0.9560151471016604,
618
+ "eval_f1-das": 0.9725213516524323,
619
+ "eval_f1-l1": 0.9543094496365525,
620
+ "eval_f1-l1l2": 0.9620471535365152,
621
+ "eval_f1-l2": 0.958195089581951,
622
+ "eval_loss": 0.14890924096107483,
623
+ "eval_precision": 0.9586684539767649,
624
+ "eval_precision-all": 0.9488291413703382,
625
+ "eval_precision-das": 0.9692820133234641,
626
+ "eval_precision-l1": 0.9440164355418593,
627
+ "eval_precision-l1l2": 0.9557269351613824,
628
+ "eval_precision-l2": 0.955026455026455,
629
+ "eval_recall": 0.9675310033821871,
630
+ "eval_recall-all": 0.9633108306427942,
631
+ "eval_recall-das": 0.9757824143070045,
632
+ "eval_recall-l1": 0.9648293963254593,
633
+ "eval_recall-l1l2": 0.968451519536903,
634
+ "eval_recall-l2": 0.9613848202396804,
635
+ "eval_runtime": 6.5579,
636
+ "eval_samples_per_second": 103.082,
637
+ "eval_steps_per_second": 6.557,
638
+ "step": 600
639
+ },
640
+ {
641
+ "epoch": 1.84,
642
+ "eval_ACT": {
643
+ "f1": 0.9421800947867298,
644
+ "number": 519,
645
+ "precision": 0.9272388059701493,
646
+ "recall": 0.9576107899807321
647
+ },
648
+ "eval_ACT_L1": {
649
+ "f1": 0.9573643410852714,
650
+ "number": 503,
651
+ "precision": 0.9338374291115312,
652
+ "recall": 0.9821073558648111
653
+ },
654
+ "eval_ACT_L2": {
655
+ "f1": 0.26086956521739124,
656
+ "number": 16,
657
+ "precision": 0.42857142857142855,
658
+ "recall": 0.1875
659
+ },
660
+ "eval_CARDINAL": {
661
+ "f1": 0.9933774834437086,
662
+ "number": 678,
663
+ "precision": 0.9911894273127754,
664
+ "recall": 0.995575221238938
665
+ },
666
+ "eval_DESC": {
667
+ "f1": 0.4126984126984127,
668
+ "number": 30,
669
+ "precision": 0.3939393939393939,
670
+ "recall": 0.43333333333333335
671
+ },
672
+ "eval_FT": {
673
+ "f1": 0.3333333333333333,
674
+ "number": 7,
675
+ "precision": 0.4,
676
+ "recall": 0.2857142857142857
677
+ },
678
+ "eval_LOC": {
679
+ "f1": 0.9566343042071198,
680
+ "number": 762,
681
+ "precision": 0.9438058748403576,
682
+ "recall": 0.9698162729658792
683
+ },
684
+ "eval_PER": {
685
+ "f1": 0.9852507374631269,
686
+ "number": 676,
687
+ "precision": 0.9823529411764705,
688
+ "recall": 0.9881656804733728
689
+ },
690
+ "eval_SPAT": {
691
+ "f1": 0.9634931997136722,
692
+ "number": 694,
693
+ "precision": 0.957325746799431,
694
+ "recall": 0.9697406340057637
695
+ },
696
+ "eval_TITRE": {
697
+ "f1": 0.0,
698
+ "number": 2,
699
+ "precision": 0.0,
700
+ "recall": 0.0
701
+ },
702
+ "eval_TITREH": {
703
+ "f1": 0.927536231884058,
704
+ "number": 33,
705
+ "precision": 0.8888888888888888,
706
+ "recall": 0.9696969696969697
707
+ },
708
+ "eval_TITREP": {
709
+ "f1": 0.3333333333333333,
710
+ "number": 6,
711
+ "precision": 0.3333333333333333,
712
+ "recall": 0.3333333333333333
713
+ },
714
+ "eval_accuracy": 0.9669811320754716,
715
+ "eval_accuracy-all": 0.9762288977159881,
716
+ "eval_accuracy-das": 0.980759682224429,
717
+ "eval_accuracy-l1": 0.9724428997020854,
718
+ "eval_accuracy-l1l2": 0.9677259185700099,
719
+ "eval_accuracy-l2": 0.9800148957298908,
720
+ "eval_f1": 0.9667938074938299,
721
+ "eval_f1-all": 0.9609898107714702,
722
+ "eval_f1-das": 0.9720111214087118,
723
+ "eval_f1-l1": 0.96,
724
+ "eval_f1-l1l2": 0.964824120603015,
725
+ "eval_f1-l2": 0.9622516556291391,
726
+ "eval_loss": 0.15314123034477234,
727
+ "eval_precision": 0.962045099352534,
728
+ "eval_precision-all": 0.9532197516604101,
729
+ "eval_precision-das": 0.967170785687938,
730
+ "eval_precision-l1": 0.9501285347043702,
731
+ "eval_precision-l1l2": 0.9572649572649573,
732
+ "eval_precision-l2": 0.9571805006587615,
733
+ "eval_recall": 0.9715896279594137,
734
+ "eval_recall-all": 0.9688875843850895,
735
+ "eval_recall-das": 0.9769001490312966,
736
+ "eval_recall-l1": 0.9700787401574803,
737
+ "eval_recall-l1l2": 0.9725036179450073,
738
+ "eval_recall-l2": 0.9673768308921438,
739
+ "eval_runtime": 7.6675,
740
+ "eval_samples_per_second": 88.164,
741
+ "eval_steps_per_second": 5.608,
742
+ "step": 700
743
+ },
744
+ {
745
+ "epoch": 2.1,
746
+ "eval_ACT": {
747
+ "f1": 0.9300567107750471,
748
+ "number": 519,
749
+ "precision": 0.9128014842300557,
750
+ "recall": 0.9479768786127167
751
+ },
752
+ "eval_ACT_L1": {
753
+ "f1": 0.9568627450980391,
754
+ "number": 503,
755
+ "precision": 0.9439071566731141,
756
+ "recall": 0.9701789264413518
757
+ },
758
+ "eval_ACT_L2": {
759
+ "f1": 0.2105263157894737,
760
+ "number": 16,
761
+ "precision": 0.18181818181818182,
762
+ "recall": 0.25
763
+ },
764
+ "eval_CARDINAL": {
765
+ "f1": 0.9933774834437086,
766
+ "number": 678,
767
+ "precision": 0.9911894273127754,
768
+ "recall": 0.995575221238938
769
+ },
770
+ "eval_DESC": {
771
+ "f1": 0.37499999999999994,
772
+ "number": 30,
773
+ "precision": 0.3,
774
+ "recall": 0.5
775
+ },
776
+ "eval_FT": {
777
+ "f1": 0.3333333333333333,
778
+ "number": 7,
779
+ "precision": 0.4,
780
+ "recall": 0.2857142857142857
781
+ },
782
+ "eval_LOC": {
783
+ "f1": 0.9635890767230169,
784
+ "number": 762,
785
+ "precision": 0.9548969072164949,
786
+ "recall": 0.9724409448818898
787
+ },
788
+ "eval_PER": {
789
+ "f1": 0.986019131714496,
790
+ "number": 676,
791
+ "precision": 0.9809663250366032,
792
+ "recall": 0.9911242603550295
793
+ },
794
+ "eval_SPAT": {
795
+ "f1": 0.9591982820329277,
796
+ "number": 694,
797
+ "precision": 0.9530583214793741,
798
+ "recall": 0.9654178674351584
799
+ },
800
+ "eval_TITRE": {
801
+ "f1": 0.0,
802
+ "number": 2,
803
+ "precision": 0.0,
804
+ "recall": 0.0
805
+ },
806
+ "eval_TITREH": {
807
+ "f1": 0.9090909090909091,
808
+ "number": 33,
809
+ "precision": 0.9090909090909091,
810
+ "recall": 0.9090909090909091
811
+ },
812
+ "eval_TITREP": {
813
+ "f1": 0.6153846153846153,
814
+ "number": 6,
815
+ "precision": 0.5714285714285714,
816
+ "recall": 0.6666666666666666
817
+ },
818
+ "eval_accuracy": 0.9632571996027806,
819
+ "eval_accuracy-all": 0.9734980139026812,
820
+ "eval_accuracy-das": 0.9815044687189672,
821
+ "eval_accuracy-l1": 0.9703326713008937,
822
+ "eval_accuracy-l1l2": 0.9643743793445879,
823
+ "eval_accuracy-l2": 0.9766633565044687,
824
+ "eval_f1": 0.9649299719887955,
825
+ "eval_f1-all": 0.9584543869843115,
826
+ "eval_f1-das": 0.9727323316638843,
827
+ "eval_f1-l1": 0.9554173146708138,
828
+ "eval_f1-l1l2": 0.9624534250501576,
829
+ "eval_f1-l2": 0.9623265036351619,
830
+ "eval_loss": 0.13265174627304077,
831
+ "eval_precision": 0.9590200445434298,
832
+ "eval_precision-all": 0.9488064423353466,
833
+ "eval_precision-das": 0.9685999261174733,
834
+ "eval_precision-l1": 0.9436763952892985,
835
+ "eval_precision-l1l2": 0.9531649162645472,
836
+ "eval_precision-l2": 0.9553805774278216,
837
+ "eval_recall": 0.970913190529876,
838
+ "eval_recall-all": 0.9683005576753743,
839
+ "eval_recall-das": 0.9769001490312966,
840
+ "eval_recall-l1": 0.9674540682414698,
841
+ "eval_recall-l1l2": 0.9719247467438495,
842
+ "eval_recall-l2": 0.9693741677762983,
843
+ "eval_runtime": 7.359,
844
+ "eval_samples_per_second": 91.86,
845
+ "eval_steps_per_second": 5.843,
846
+ "step": 800
847
+ },
848
+ {
849
+ "epoch": 2.36,
850
+ "eval_ACT": {
851
+ "f1": 0.9409559512652297,
852
+ "number": 519,
853
+ "precision": 0.916058394160584,
854
+ "recall": 0.9672447013487476
855
+ },
856
+ "eval_ACT_L1": {
857
+ "f1": 0.96484375,
858
+ "number": 503,
859
+ "precision": 0.9481765834932822,
860
+ "recall": 0.9821073558648111
861
+ },
862
+ "eval_ACT_L2": {
863
+ "f1": 0.37209302325581395,
864
+ "number": 16,
865
+ "precision": 0.2962962962962963,
866
+ "recall": 0.5
867
+ },
868
+ "eval_CARDINAL": {
869
+ "f1": 0.9933774834437086,
870
+ "number": 678,
871
+ "precision": 0.9911894273127754,
872
+ "recall": 0.995575221238938
873
+ },
874
+ "eval_DESC": {
875
+ "f1": 0.47368421052631576,
876
+ "number": 30,
877
+ "precision": 0.391304347826087,
878
+ "recall": 0.6
879
+ },
880
+ "eval_FT": {
881
+ "f1": 0.3333333333333333,
882
+ "number": 7,
883
+ "precision": 0.4,
884
+ "recall": 0.2857142857142857
885
+ },
886
+ "eval_LOC": {
887
+ "f1": 0.9609375,
888
+ "number": 762,
889
+ "precision": 0.9534883720930233,
890
+ "recall": 0.968503937007874
891
+ },
892
+ "eval_PER": {
893
+ "f1": 0.9852507374631269,
894
+ "number": 676,
895
+ "precision": 0.9823529411764705,
896
+ "recall": 0.9881656804733728
897
+ },
898
+ "eval_SPAT": {
899
+ "f1": 0.9597701149425288,
900
+ "number": 694,
901
+ "precision": 0.9570200573065902,
902
+ "recall": 0.962536023054755
903
+ },
904
+ "eval_TITRE": {
905
+ "f1": 0.0,
906
+ "number": 2,
907
+ "precision": 0.0,
908
+ "recall": 0.0
909
+ },
910
+ "eval_TITREH": {
911
+ "f1": 0.9253731343283583,
912
+ "number": 33,
913
+ "precision": 0.9117647058823529,
914
+ "recall": 0.9393939393939394
915
+ },
916
+ "eval_TITREP": {
917
+ "f1": 0.42857142857142855,
918
+ "number": 6,
919
+ "precision": 0.375,
920
+ "recall": 0.5
921
+ },
922
+ "eval_accuracy": 0.9653674280039722,
923
+ "eval_accuracy-all": 0.9744289970208541,
924
+ "eval_accuracy-das": 0.9823733862959285,
925
+ "eval_accuracy-l1": 0.9714498510427011,
926
+ "eval_accuracy-l1l2": 0.9663604766633564,
927
+ "eval_accuracy-l2": 0.9774081429990069,
928
+ "eval_f1": 0.9669171245934731,
929
+ "eval_f1-all": 0.960616189507339,
930
+ "eval_f1-das": 0.9740452354467927,
931
+ "eval_f1-l1": 0.96,
932
+ "eval_f1-l1l2": 0.9648745519713262,
933
+ "eval_f1-l2": 0.9613988782580007,
934
+ "eval_loss": 0.14285241067409515,
935
+ "eval_precision": 0.9618473895582329,
936
+ "eval_precision-all": 0.9513529073114565,
937
+ "eval_precision-das": 0.9693726937269372,
938
+ "eval_precision-l1": 0.9501285347043702,
939
+ "eval_precision-l1l2": 0.9559659090909091,
940
+ "eval_precision-l2": 0.9529103989535644,
941
+ "eval_recall": 0.9720405862457723,
942
+ "eval_recall-all": 0.9700616378045201,
943
+ "eval_recall-das": 0.9787630402384501,
944
+ "eval_recall-l1": 0.9700787401574803,
945
+ "eval_recall-l1l2": 0.9739507959479016,
946
+ "eval_recall-l2": 0.9700399467376831,
947
+ "eval_runtime": 7.5384,
948
+ "eval_samples_per_second": 89.674,
949
+ "eval_steps_per_second": 5.704,
950
+ "step": 900
951
+ },
952
+ {
953
+ "epoch": 2.62,
954
+ "learning_rate": 8e-05,
955
+ "loss": 0.1442,
956
+ "step": 1000
957
+ },
958
+ {
959
+ "epoch": 2.62,
960
+ "eval_ACT": {
961
+ "f1": 0.9571020019065777,
962
+ "number": 519,
963
+ "precision": 0.9471698113207547,
964
+ "recall": 0.9672447013487476
965
+ },
966
+ "eval_ACT_L1": {
967
+ "f1": 0.9782178217821782,
968
+ "number": 503,
969
+ "precision": 0.9743589743589743,
970
+ "recall": 0.9821073558648111
971
+ },
972
+ "eval_ACT_L2": {
973
+ "f1": 0.41025641025641024,
974
+ "number": 16,
975
+ "precision": 0.34782608695652173,
976
+ "recall": 0.5
977
+ },
978
+ "eval_CARDINAL": {
979
+ "f1": 0.9919058130978661,
980
+ "number": 678,
981
+ "precision": 0.9897209985315712,
982
+ "recall": 0.9941002949852508
983
+ },
984
+ "eval_DESC": {
985
+ "f1": 0.47368421052631576,
986
+ "number": 30,
987
+ "precision": 0.391304347826087,
988
+ "recall": 0.6
989
+ },
990
+ "eval_FT": {
991
+ "f1": 0.30769230769230765,
992
+ "number": 7,
993
+ "precision": 0.3333333333333333,
994
+ "recall": 0.2857142857142857
995
+ },
996
+ "eval_LOC": {
997
+ "f1": 0.9712041884816753,
998
+ "number": 762,
999
+ "precision": 0.9686684073107049,
1000
+ "recall": 0.973753280839895
1001
+ },
1002
+ "eval_PER": {
1003
+ "f1": 0.9867060561299853,
1004
+ "number": 676,
1005
+ "precision": 0.9852507374631269,
1006
+ "recall": 0.9881656804733728
1007
+ },
1008
+ "eval_SPAT": {
1009
+ "f1": 0.9621157969978557,
1010
+ "number": 694,
1011
+ "precision": 0.9546099290780142,
1012
+ "recall": 0.9697406340057637
1013
+ },
1014
+ "eval_TITRE": {
1015
+ "f1": 0.0,
1016
+ "number": 2,
1017
+ "precision": 0.0,
1018
+ "recall": 0.0
1019
+ },
1020
+ "eval_TITREH": {
1021
+ "f1": 0.9253731343283583,
1022
+ "number": 33,
1023
+ "precision": 0.9117647058823529,
1024
+ "recall": 0.9393939393939394
1025
+ },
1026
+ "eval_TITREP": {
1027
+ "f1": 0.42857142857142855,
1028
+ "number": 6,
1029
+ "precision": 0.375,
1030
+ "recall": 0.5
1031
+ },
1032
+ "eval_accuracy": 0.9658639523336644,
1033
+ "eval_accuracy-all": 0.9746772591857001,
1034
+ "eval_accuracy-das": 0.9833664349553128,
1035
+ "eval_accuracy-l1": 0.971077457795432,
1036
+ "eval_accuracy-l1l2": 0.9664846077457795,
1037
+ "eval_accuracy-l2": 0.9782770605759682,
1038
+ "eval_f1": 0.9711776626885835,
1039
+ "eval_f1-all": 0.9657484331730068,
1040
+ "eval_f1-das": 0.9778769287971741,
1041
+ "eval_f1-l1": 0.9648529028898724,
1042
+ "eval_f1-l1l2": 0.9700633275762809,
1043
+ "eval_f1-l2": 0.966887417218543,
1044
+ "eval_loss": 0.1273569017648697,
1045
+ "eval_precision": 0.9698673262873847,
1046
+ "eval_precision-all": 0.959177764910249,
1047
+ "eval_precision-das": 0.9758812615955473,
1048
+ "eval_precision-l1": 0.9571280991735537,
1049
+ "eval_precision-l1l2": 0.9647867162897223,
1050
+ "eval_precision-l2": 0.9617918313570487,
1051
+ "eval_recall": 0.9724915445321308,
1052
+ "eval_recall-all": 0.9724097446433813,
1053
+ "eval_recall-das": 0.9798807749627422,
1054
+ "eval_recall-l1": 0.9727034120734908,
1055
+ "eval_recall-l1l2": 0.975397973950796,
1056
+ "eval_recall-l2": 0.9720372836218375,
1057
+ "eval_runtime": 6.084,
1058
+ "eval_samples_per_second": 111.111,
1059
+ "eval_steps_per_second": 7.068,
1060
+ "step": 1000
1061
+ },
1062
+ {
1063
+ "epoch": 2.89,
1064
+ "eval_ACT": {
1065
+ "f1": 0.9563567362428842,
1066
+ "number": 519,
1067
+ "precision": 0.9420560747663551,
1068
+ "recall": 0.9710982658959537
1069
+ },
1070
+ "eval_ACT_L1": {
1071
+ "f1": 0.9782608695652174,
1072
+ "number": 503,
1073
+ "precision": 0.9724950884086444,
1074
+ "recall": 0.9840954274353877
1075
+ },
1076
+ "eval_ACT_L2": {
1077
+ "f1": 0.4285714285714286,
1078
+ "number": 16,
1079
+ "precision": 0.34615384615384615,
1080
+ "recall": 0.5625
1081
+ },
1082
+ "eval_CARDINAL": {
1083
+ "f1": 0.9933677229182019,
1084
+ "number": 678,
1085
+ "precision": 0.9926362297496318,
1086
+ "recall": 0.9941002949852508
1087
+ },
1088
+ "eval_DESC": {
1089
+ "f1": 0.5070422535211268,
1090
+ "number": 30,
1091
+ "precision": 0.43902439024390244,
1092
+ "recall": 0.6
1093
+ },
1094
+ "eval_FT": {
1095
+ "f1": 0.36363636363636365,
1096
+ "number": 7,
1097
+ "precision": 0.5,
1098
+ "recall": 0.2857142857142857
1099
+ },
1100
+ "eval_LOC": {
1101
+ "f1": 0.9713541666666666,
1102
+ "number": 762,
1103
+ "precision": 0.9638242894056848,
1104
+ "recall": 0.979002624671916
1105
+ },
1106
+ "eval_PER": {
1107
+ "f1": 0.9859778597785979,
1108
+ "number": 676,
1109
+ "precision": 0.9837997054491899,
1110
+ "recall": 0.9881656804733728
1111
+ },
1112
+ "eval_SPAT": {
1113
+ "f1": 0.9654676258992806,
1114
+ "number": 694,
1115
+ "precision": 0.9640804597701149,
1116
+ "recall": 0.9668587896253602
1117
+ },
1118
+ "eval_TITRE": {
1119
+ "f1": 0.0,
1120
+ "number": 2,
1121
+ "precision": 0.0,
1122
+ "recall": 0.0
1123
+ },
1124
+ "eval_TITREH": {
1125
+ "f1": 0.9696969696969697,
1126
+ "number": 33,
1127
+ "precision": 0.9696969696969697,
1128
+ "recall": 0.9696969696969697
1129
+ },
1130
+ "eval_TITREP": {
1131
+ "f1": 0.42857142857142855,
1132
+ "number": 6,
1133
+ "precision": 0.375,
1134
+ "recall": 0.5
1135
+ },
1136
+ "eval_accuracy": 0.9636295928500497,
1137
+ "eval_accuracy-all": 0.9731256206554121,
1138
+ "eval_accuracy-das": 0.9812562065541212,
1139
+ "eval_accuracy-l1": 0.9700844091360477,
1140
+ "eval_accuracy-l1l2": 0.964746772591857,
1141
+ "eval_accuracy-l2": 0.9761668321747765,
1142
+ "eval_f1": 0.9710437710437709,
1143
+ "eval_f1-all": 0.9679113185530922,
1144
+ "eval_f1-das": 0.9770114942528736,
1145
+ "eval_f1-l1": 0.9671018276762402,
1146
+ "eval_f1-l1l2": 0.9714039373473201,
1147
+ "eval_f1-l2": 0.9689358889623265,
1148
+ "eval_loss": 0.15453395247459412,
1149
+ "eval_precision": 0.9667039106145251,
1150
+ "eval_precision-all": 0.9620179762249927,
1151
+ "eval_precision-das": 0.9723247232472325,
1152
+ "eval_precision-l1": 0.9620779220779221,
1153
+ "eval_precision-l1l2": 0.9646118721461188,
1154
+ "eval_precision-l2": 0.9619422572178478,
1155
+ "eval_recall": 0.9754227733934611,
1156
+ "eval_recall-all": 0.9738773114176695,
1157
+ "eval_recall-das": 0.9817436661698957,
1158
+ "eval_recall-l1": 0.9721784776902888,
1159
+ "eval_recall-l1l2": 0.9782923299565847,
1160
+ "eval_recall-l2": 0.9760319573901465,
1161
+ "eval_runtime": 6.429,
1162
+ "eval_samples_per_second": 105.148,
1163
+ "eval_steps_per_second": 6.688,
1164
+ "step": 1100
1165
+ },
1166
+ {
1167
+ "epoch": 3.15,
1168
+ "eval_ACT": {
1169
+ "f1": 0.9466666666666668,
1170
+ "number": 519,
1171
+ "precision": 0.935969868173258,
1172
+ "recall": 0.9576107899807321
1173
+ },
1174
+ "eval_ACT_L1": {
1175
+ "f1": 0.9674234945705825,
1176
+ "number": 503,
1177
+ "precision": 0.9607843137254902,
1178
+ "recall": 0.974155069582505
1179
+ },
1180
+ "eval_ACT_L2": {
1181
+ "f1": 0.37837837837837834,
1182
+ "number": 16,
1183
+ "precision": 0.3333333333333333,
1184
+ "recall": 0.4375
1185
+ },
1186
+ "eval_CARDINAL": {
1187
+ "f1": 0.9933774834437086,
1188
+ "number": 678,
1189
+ "precision": 0.9911894273127754,
1190
+ "recall": 0.995575221238938
1191
+ },
1192
+ "eval_DESC": {
1193
+ "f1": 0.547945205479452,
1194
+ "number": 30,
1195
+ "precision": 0.46511627906976744,
1196
+ "recall": 0.6666666666666666
1197
+ },
1198
+ "eval_FT": {
1199
+ "f1": 0.4615384615384615,
1200
+ "number": 7,
1201
+ "precision": 0.5,
1202
+ "recall": 0.42857142857142855
1203
+ },
1204
+ "eval_LOC": {
1205
+ "f1": 0.9647979139504563,
1206
+ "number": 762,
1207
+ "precision": 0.9585492227979274,
1208
+ "recall": 0.9711286089238845
1209
+ },
1210
+ "eval_PER": {
1211
+ "f1": 0.9881656804733728,
1212
+ "number": 676,
1213
+ "precision": 0.9881656804733728,
1214
+ "recall": 0.9881656804733728
1215
+ },
1216
+ "eval_SPAT": {
1217
+ "f1": 0.9691756272401433,
1218
+ "number": 694,
1219
+ "precision": 0.9643366619115549,
1220
+ "recall": 0.9740634005763689
1221
+ },
1222
+ "eval_TITRE": {
1223
+ "f1": 0.0,
1224
+ "number": 2,
1225
+ "precision": 0.0,
1226
+ "recall": 0.0
1227
+ },
1228
+ "eval_TITREH": {
1229
+ "f1": 0.9393939393939394,
1230
+ "number": 33,
1231
+ "precision": 0.9393939393939394,
1232
+ "recall": 0.9393939393939394
1233
+ },
1234
+ "eval_TITREP": {
1235
+ "f1": 0.6,
1236
+ "number": 6,
1237
+ "precision": 0.75,
1238
+ "recall": 0.5
1239
+ },
1240
+ "eval_accuracy": 0.964746772591857,
1241
+ "eval_accuracy-all": 0.9746151936444886,
1242
+ "eval_accuracy-das": 0.9803872889771599,
1243
+ "eval_accuracy-l1": 0.9708291956305859,
1244
+ "eval_accuracy-l1l2": 0.9652432969215492,
1245
+ "eval_accuracy-l2": 0.9784011916583912,
1246
+ "eval_f1": 0.9706774519716885,
1247
+ "eval_f1-all": 0.9667347534286548,
1248
+ "eval_f1-das": 0.9745589600742803,
1249
+ "eval_f1-l1": 0.9668839634941329,
1250
+ "eval_f1-l1l2": 0.9678068410462776,
1251
+ "eval_f1-l2": 0.9665452136469029,
1252
+ "eval_loss": 0.14055882394313812,
1253
+ "eval_precision": 0.9673085535154501,
1254
+ "eval_precision-all": 0.9611256164780969,
1255
+ "eval_precision-das": 0.9714920399851906,
1256
+ "eval_precision-l1": 0.960621761658031,
1257
+ "eval_precision-l1l2": 0.96117613474165,
1258
+ "eval_precision-l2": 0.961766644693474,
1259
+ "eval_recall": 0.9740698985343855,
1260
+ "eval_recall-all": 0.9724097446433813,
1261
+ "eval_recall-das": 0.977645305514158,
1262
+ "eval_recall-l1": 0.9732283464566929,
1263
+ "eval_recall-l1l2": 0.9745296671490593,
1264
+ "eval_recall-l2": 0.9713715046604527,
1265
+ "eval_runtime": 5.9342,
1266
+ "eval_samples_per_second": 113.916,
1267
+ "eval_steps_per_second": 7.246,
1268
+ "step": 1200
1269
+ },
1270
+ {
1271
+ "epoch": 3.41,
1272
+ "eval_ACT": {
1273
+ "f1": 0.9363295880149812,
1274
+ "number": 519,
1275
+ "precision": 0.9107468123861566,
1276
+ "recall": 0.9633911368015414
1277
+ },
1278
+ "eval_ACT_L1": {
1279
+ "f1": 0.9591439688715954,
1280
+ "number": 503,
1281
+ "precision": 0.939047619047619,
1282
+ "recall": 0.9801192842942346
1283
+ },
1284
+ "eval_ACT_L2": {
1285
+ "f1": 0.35000000000000003,
1286
+ "number": 16,
1287
+ "precision": 0.2916666666666667,
1288
+ "recall": 0.4375
1289
+ },
1290
+ "eval_CARDINAL": {
1291
+ "f1": 0.9933774834437086,
1292
+ "number": 678,
1293
+ "precision": 0.9911894273127754,
1294
+ "recall": 0.995575221238938
1295
+ },
1296
+ "eval_DESC": {
1297
+ "f1": 0.43037974683544306,
1298
+ "number": 30,
1299
+ "precision": 0.3469387755102041,
1300
+ "recall": 0.5666666666666667
1301
+ },
1302
+ "eval_FT": {
1303
+ "f1": 0.42857142857142855,
1304
+ "number": 7,
1305
+ "precision": 0.42857142857142855,
1306
+ "recall": 0.42857142857142855
1307
+ },
1308
+ "eval_LOC": {
1309
+ "f1": 0.9636363636363636,
1310
+ "number": 762,
1311
+ "precision": 0.9537275064267352,
1312
+ "recall": 0.973753280839895
1313
+ },
1314
+ "eval_PER": {
1315
+ "f1": 0.9845246868091379,
1316
+ "number": 676,
1317
+ "precision": 0.9809104258443465,
1318
+ "recall": 0.9881656804733728
1319
+ },
1320
+ "eval_SPAT": {
1321
+ "f1": 0.9707351891506067,
1322
+ "number": 694,
1323
+ "precision": 0.9618104667609618,
1324
+ "recall": 0.9798270893371758
1325
+ },
1326
+ "eval_TITRE": {
1327
+ "f1": 0.0,
1328
+ "number": 2,
1329
+ "precision": 0.0,
1330
+ "recall": 0.0
1331
+ },
1332
+ "eval_TITREH": {
1333
+ "f1": 0.9253731343283583,
1334
+ "number": 33,
1335
+ "precision": 0.9117647058823529,
1336
+ "recall": 0.9393939393939394
1337
+ },
1338
+ "eval_TITREP": {
1339
+ "f1": 0.42857142857142855,
1340
+ "number": 6,
1341
+ "precision": 0.375,
1342
+ "recall": 0.5
1343
+ },
1344
+ "eval_accuracy": 0.967974180734856,
1345
+ "eval_accuracy-all": 0.9767254220456802,
1346
+ "eval_accuracy-das": 0.9826216484607746,
1347
+ "eval_accuracy-l1": 0.9735600794438928,
1348
+ "eval_accuracy-l1l2": 0.9685948361469712,
1349
+ "eval_accuracy-l2": 0.9798907646474677,
1350
+ "eval_f1": 0.9691876750700281,
1351
+ "eval_f1-all": 0.961889581220113,
1352
+ "eval_f1-das": 0.9733333333333334,
1353
+ "eval_f1-l1": 0.960951642099819,
1354
+ "eval_f1-l1l2": 0.9658928059615935,
1355
+ "eval_f1-l2": 0.963085036255768,
1356
+ "eval_loss": 0.13519717752933502,
1357
+ "eval_precision": 0.9632516703786191,
1358
+ "eval_precision-all": 0.9499141385231826,
1359
+ "eval_precision-das": 0.96759941089838,
1360
+ "eval_precision-l1": 0.9469928644240571,
1361
+ "eval_precision-l1l2": 0.9565711041725802,
1362
+ "eval_precision-l2": 0.9536553524804178,
1363
+ "eval_recall": 0.9751972942502819,
1364
+ "eval_recall-all": 0.9741708247725271,
1365
+ "eval_recall-das": 0.9791356184798807,
1366
+ "eval_recall-l1": 0.9753280839895013,
1367
+ "eval_recall-l1l2": 0.975397973950796,
1368
+ "eval_recall-l2": 0.9727030625832224,
1369
+ "eval_runtime": 6.3863,
1370
+ "eval_samples_per_second": 105.852,
1371
+ "eval_steps_per_second": 6.733,
1372
+ "step": 1300
1373
+ },
1374
+ {
1375
+ "epoch": 3.67,
1376
+ "eval_ACT": {
1377
+ "f1": 0.9461756373937679,
1378
+ "number": 519,
1379
+ "precision": 0.9277777777777778,
1380
+ "recall": 0.9653179190751445
1381
+ },
1382
+ "eval_ACT_L1": {
1383
+ "f1": 0.9686274509803922,
1384
+ "number": 503,
1385
+ "precision": 0.9555125725338491,
1386
+ "recall": 0.9821073558648111
1387
+ },
1388
+ "eval_ACT_L2": {
1389
+ "f1": 0.358974358974359,
1390
+ "number": 16,
1391
+ "precision": 0.30434782608695654,
1392
+ "recall": 0.4375
1393
+ },
1394
+ "eval_CARDINAL": {
1395
+ "f1": 0.9933774834437086,
1396
+ "number": 678,
1397
+ "precision": 0.9911894273127754,
1398
+ "recall": 0.995575221238938
1399
+ },
1400
+ "eval_DESC": {
1401
+ "f1": 0.5507246376811593,
1402
+ "number": 30,
1403
+ "precision": 0.48717948717948717,
1404
+ "recall": 0.6333333333333333
1405
+ },
1406
+ "eval_FT": {
1407
+ "f1": 0.5,
1408
+ "number": 7,
1409
+ "precision": 0.6,
1410
+ "recall": 0.42857142857142855
1411
+ },
1412
+ "eval_LOC": {
1413
+ "f1": 0.9679529103989535,
1414
+ "number": 762,
1415
+ "precision": 0.9647979139504563,
1416
+ "recall": 0.9711286089238845
1417
+ },
1418
+ "eval_PER": {
1419
+ "f1": 0.9881656804733728,
1420
+ "number": 676,
1421
+ "precision": 0.9881656804733728,
1422
+ "recall": 0.9881656804733728
1423
+ },
1424
+ "eval_SPAT": {
1425
+ "f1": 0.9727403156384505,
1426
+ "number": 694,
1427
+ "precision": 0.9685714285714285,
1428
+ "recall": 0.9769452449567724
1429
+ },
1430
+ "eval_TITRE": {
1431
+ "f1": 0.0,
1432
+ "number": 2,
1433
+ "precision": 0.0,
1434
+ "recall": 0.0
1435
+ },
1436
+ "eval_TITREH": {
1437
+ "f1": 0.9696969696969697,
1438
+ "number": 33,
1439
+ "precision": 0.9696969696969697,
1440
+ "recall": 0.9696969696969697
1441
+ },
1442
+ "eval_TITREP": {
1443
+ "f1": 0.4615384615384615,
1444
+ "number": 6,
1445
+ "precision": 0.42857142857142855,
1446
+ "recall": 0.5
1447
+ },
1448
+ "eval_accuracy": 0.9664846077457795,
1449
+ "eval_accuracy-all": 0.9749255213505462,
1450
+ "eval_accuracy-das": 0.9826216484607746,
1451
+ "eval_accuracy-l1": 0.9723187686196624,
1452
+ "eval_accuracy-l1l2": 0.9669811320754716,
1453
+ "eval_accuracy-l2": 0.97753227408143,
1454
+ "eval_f1": 0.9732283464566929,
1455
+ "eval_f1-all": 0.9683442742523706,
1456
+ "eval_f1-das": 0.9756912228613843,
1457
+ "eval_f1-l1": 0.9689861871253583,
1458
+ "eval_f1-l1l2": 0.9711981566820277,
1459
+ "eval_f1-l2": 0.9675281643472498,
1460
+ "eval_loss": 0.1356203556060791,
1461
+ "eval_precision": 0.971043771043771,
1462
+ "eval_precision-all": 0.9625870069605569,
1463
+ "eval_precision-das": 0.9719038817005545,
1464
+ "eval_precision-l1": 0.9622153209109731,
1465
+ "eval_precision-l1l2": 0.9664660361134996,
1466
+ "eval_precision-l2": 0.9630606860158312,
1467
+ "eval_recall": 0.9754227733934611,
1468
+ "eval_recall-all": 0.9741708247725271,
1469
+ "eval_recall-das": 0.9795081967213115,
1470
+ "eval_recall-l1": 0.9758530183727034,
1471
+ "eval_recall-l1l2": 0.9759768451519537,
1472
+ "eval_recall-l2": 0.9720372836218375,
1473
+ "eval_runtime": 7.0867,
1474
+ "eval_samples_per_second": 95.39,
1475
+ "eval_steps_per_second": 6.068,
1476
+ "step": 1400
1477
+ }
1478
+ ],
1479
+ "max_steps": 5000,
1480
+ "num_train_epochs": 14,
1481
+ "total_flos": 564085470663792.0,
1482
+ "trial_name": null,
1483
+ "trial_params": null
1484
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf5b7bef3e97fe154a638a70f49a7795e99302caebf2ef1a5caf5e066ae236e9
3
+ size 3567