nlpso commited on
Commit
305673d
1 Parent(s): e3e5292

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-PER+O",
17
+ "2": "I-PER+i_TITREH",
18
+ "3": "I-ACT+O",
19
+ "4": "I-DESC+O",
20
+ "5": "I-DESC+i_ACT",
21
+ "6": "I-DESC+i_TITREP",
22
+ "7": "I-SPAT+O",
23
+ "8": "I-SPAT+i_LOC",
24
+ "9": "I-SPAT+i_CARDINAL",
25
+ "10": "I-SPAT+i_FT",
26
+ "11": "I-TITRE+O"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "label2id": {
31
+ "I-ACT+O": 3,
32
+ "I-DESC+O": 4,
33
+ "I-DESC+i_ACT": 5,
34
+ "I-DESC+i_TITREP": 6,
35
+ "I-PER+O": 1,
36
+ "I-PER+i_TITREH": 2,
37
+ "I-SPAT+O": 7,
38
+ "I-SPAT+i_CARDINAL": 9,
39
+ "I-SPAT+i_FT": 10,
40
+ "I-SPAT+i_LOC": 8,
41
+ "I-TITRE+O": 11,
42
+ "O+O": 0
43
+ },
44
+ "layer_norm_eps": 1e-05,
45
+ "max_position_embeddings": 514,
46
+ "model_type": "camembert",
47
+ "num_attention_heads": 12,
48
+ "num_hidden_layers": 12,
49
+ "output_past": true,
50
+ "pad_token_id": 1,
51
+ "position_embedding_type": "absolute",
52
+ "torch_dtype": "float32",
53
+ "transformers_version": "4.25.1",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 32005
57
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2fdcfb204bdad224a8affe18ac1701ac72acb6ac8f94e0742c209df0d76f77
3
+ size 880440037
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85095a03d7c562fae938116eeea585d664ac49e5ddf74f391a2845219556084e
3
+ size 440233393
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda1dd7aa2f1e9a485b5f20ef345078a9f371592a8eaa31a7d9896f79f644128
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51041b89734cb38f61e5930792b2813f44d4562e4b27ac1f3179a1197589a078
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,2040 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9654571843251089,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/221-camembert-ner-joint-labelling-io/checkpoint-2000",
4
+ "epoch": 5.2493438320209975,
5
+ "global_step": 2000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8818604651162791,
14
+ "number": 519,
15
+ "precision": 0.8525179856115108,
16
+ "recall": 0.9132947976878613
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.8951841359773371,
20
+ "number": 503,
21
+ "precision": 0.8525179856115108,
22
+ "recall": 0.9423459244532804
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9765739385065886,
32
+ "number": 678,
33
+ "precision": 0.9694767441860465,
34
+ "recall": 0.9837758112094396
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9248704663212436,
50
+ "number": 761,
51
+ "precision": 0.9118773946360154,
52
+ "recall": 0.938239159001314
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9236417033773863,
56
+ "number": 676,
57
+ "precision": 0.9169096209912536,
58
+ "recall": 0.9304733727810651
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.9313304721030043,
62
+ "number": 694,
63
+ "precision": 0.9247159090909091,
64
+ "recall": 0.9380403458213257
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.931030118957226,
85
+ "eval_accuracy-all": 0.9533029612756264,
86
+ "eval_accuracy-das": 0.9460895975702354,
87
+ "eval_accuracy-l1": 0.9406479372310808,
88
+ "eval_accuracy-l2": 0.9659579853201721,
89
+ "eval_f1": 0.9194107452339687,
90
+ "eval_f1-all": 0.9189506082368459,
91
+ "eval_f1-das": 0.9173768062245277,
92
+ "eval_f1-l1": 0.910932225396001,
93
+ "eval_f1-l2": 0.9293405114401078,
94
+ "eval_loss": 0.3786505162715912,
95
+ "eval_precision": 0.9136050516647531,
96
+ "eval_precision-all": 0.9174714661984197,
97
+ "eval_precision-das": 0.9126428308145964,
98
+ "eval_precision-l1": 0.9013360739979445,
99
+ "eval_precision-l2": 0.938817131203263,
100
+ "eval_recall": 0.9252906976744186,
101
+ "eval_recall-all": 0.9204345273047563,
102
+ "eval_recall-das": 0.9221601489757915,
103
+ "eval_recall-l1": 0.920734908136483,
104
+ "eval_recall-l2": 0.9200532978014657,
105
+ "eval_runtime": 5.4791,
106
+ "eval_samples_per_second": 123.379,
107
+ "eval_steps_per_second": 7.848,
108
+ "step": 100
109
+ },
110
+ {
111
+ "epoch": 0.52,
112
+ "eval_ACT": {
113
+ "f1": 0.8797061524334251,
114
+ "number": 519,
115
+ "precision": 0.8403508771929824,
116
+ "recall": 0.9229287090558767
117
+ },
118
+ "eval_ACT_L1": {
119
+ "f1": 0.8928238583410996,
120
+ "number": 503,
121
+ "precision": 0.8403508771929824,
122
+ "recall": 0.952286282306163
123
+ },
124
+ "eval_ACT_L2": {
125
+ "f1": 0.0,
126
+ "number": 16,
127
+ "precision": 0.0,
128
+ "recall": 0.0
129
+ },
130
+ "eval_CARDINAL": {
131
+ "f1": 0.9773557341124909,
132
+ "number": 678,
133
+ "precision": 0.9681620839363242,
134
+ "recall": 0.9867256637168141
135
+ },
136
+ "eval_DESC": {
137
+ "f1": 0.09523809523809522,
138
+ "number": 30,
139
+ "precision": 0.16666666666666666,
140
+ "recall": 0.06666666666666667
141
+ },
142
+ "eval_FT": {
143
+ "f1": 0.0,
144
+ "number": 7,
145
+ "precision": 0.0,
146
+ "recall": 0.0
147
+ },
148
+ "eval_LOC": {
149
+ "f1": 0.9347123464770524,
150
+ "number": 761,
151
+ "precision": 0.9198473282442748,
152
+ "recall": 0.9500657030223391
153
+ },
154
+ "eval_PER": {
155
+ "f1": 0.9285187914517319,
156
+ "number": 676,
157
+ "precision": 0.9251101321585903,
158
+ "recall": 0.9319526627218935
159
+ },
160
+ "eval_SPAT": {
161
+ "f1": 0.9212207239176721,
162
+ "number": 694,
163
+ "precision": 0.9076923076923077,
164
+ "recall": 0.9351585014409222
165
+ },
166
+ "eval_TITRE": {
167
+ "f1": 0.0,
168
+ "number": 2,
169
+ "precision": 0.0,
170
+ "recall": 0.0
171
+ },
172
+ "eval_TITREH": {
173
+ "f1": 0.0,
174
+ "number": 33,
175
+ "precision": 0.0,
176
+ "recall": 0.0
177
+ },
178
+ "eval_TITREP": {
179
+ "f1": 0.0,
180
+ "number": 6,
181
+ "precision": 0.0,
182
+ "recall": 0.0
183
+ },
184
+ "eval_accuracy": 0.9339407744874715,
185
+ "eval_accuracy-all": 0.9529865856745128,
186
+ "eval_accuracy-das": 0.9482409516578082,
187
+ "eval_accuracy-l1": 0.9407744874715261,
188
+ "eval_accuracy-l2": 0.9651986838774994,
189
+ "eval_f1": 0.9257654534950897,
190
+ "eval_f1-all": 0.9188164990526161,
191
+ "eval_f1-das": 0.9222242748937742,
192
+ "eval_f1-l1": 0.9065155807365439,
193
+ "eval_f1-l2": 0.9348556077904635,
194
+ "eval_loss": 0.2861093580722809,
195
+ "eval_precision": 0.9199196326061998,
196
+ "eval_precision-all": 0.912301013024602,
197
+ "eval_precision-das": 0.9149560117302052,
198
+ "eval_precision-l1": 0.8897876643073812,
199
+ "eval_precision-l2": 0.942450914014895,
200
+ "eval_recall": 0.9316860465116279,
201
+ "eval_recall-all": 0.9254257193188491,
202
+ "eval_recall-das": 0.929608938547486,
203
+ "eval_recall-l1": 0.9238845144356955,
204
+ "eval_recall-l2": 0.927381745502998,
205
+ "eval_runtime": 5.893,
206
+ "eval_samples_per_second": 114.712,
207
+ "eval_steps_per_second": 7.297,
208
+ "step": 200
209
+ },
210
+ {
211
+ "epoch": 0.79,
212
+ "eval_ACT": {
213
+ "f1": 0.9220532319391636,
214
+ "number": 519,
215
+ "precision": 0.9099437148217636,
216
+ "recall": 0.9344894026974951
217
+ },
218
+ "eval_ACT_L1": {
219
+ "f1": 0.9362934362934364,
220
+ "number": 503,
221
+ "precision": 0.9099437148217636,
222
+ "recall": 0.9642147117296223
223
+ },
224
+ "eval_ACT_L2": {
225
+ "f1": 0.0,
226
+ "number": 16,
227
+ "precision": 0.0,
228
+ "recall": 0.0
229
+ },
230
+ "eval_CARDINAL": {
231
+ "f1": 0.9860396767083027,
232
+ "number": 678,
233
+ "precision": 0.9824304538799414,
234
+ "recall": 0.9896755162241888
235
+ },
236
+ "eval_DESC": {
237
+ "f1": 0.27450980392156865,
238
+ "number": 30,
239
+ "precision": 0.3333333333333333,
240
+ "recall": 0.23333333333333334
241
+ },
242
+ "eval_FT": {
243
+ "f1": 0.0,
244
+ "number": 7,
245
+ "precision": 0.0,
246
+ "recall": 0.0
247
+ },
248
+ "eval_LOC": {
249
+ "f1": 0.9346405228758171,
250
+ "number": 761,
251
+ "precision": 0.929778933680104,
252
+ "recall": 0.9395532194480947
253
+ },
254
+ "eval_PER": {
255
+ "f1": 0.9381443298969072,
256
+ "number": 676,
257
+ "precision": 0.9340175953079178,
258
+ "recall": 0.9423076923076923
259
+ },
260
+ "eval_SPAT": {
261
+ "f1": 0.9430199430199431,
262
+ "number": 694,
263
+ "precision": 0.9323943661971831,
264
+ "recall": 0.9538904899135446
265
+ },
266
+ "eval_TITRE": {
267
+ "f1": 0.0,
268
+ "number": 2,
269
+ "precision": 0.0,
270
+ "recall": 0.0
271
+ },
272
+ "eval_TITREH": {
273
+ "f1": 0.17777777777777776,
274
+ "number": 33,
275
+ "precision": 0.3333333333333333,
276
+ "recall": 0.12121212121212122
277
+ },
278
+ "eval_TITREP": {
279
+ "f1": 0.0,
280
+ "number": 6,
281
+ "precision": 0.0,
282
+ "recall": 0.0
283
+ },
284
+ "eval_accuracy": 0.9472285497342445,
285
+ "eval_accuracy-all": 0.9614654517843584,
286
+ "eval_accuracy-das": 0.9639331814730449,
287
+ "eval_accuracy-l1": 0.9538091622374083,
288
+ "eval_accuracy-l2": 0.9691217413313086,
289
+ "eval_f1": 0.9426157879405767,
290
+ "eval_f1-all": 0.9333920187793427,
291
+ "eval_f1-das": 0.9416153702667412,
292
+ "eval_f1-l1": 0.9301480135029863,
293
+ "eval_f1-l2": 0.9376053962900506,
294
+ "eval_loss": 0.22815603017807007,
295
+ "eval_precision": 0.9445417396380619,
296
+ "eval_precision-all": 0.9328445747800587,
297
+ "eval_precision-das": 0.9431988041853513,
298
+ "eval_precision-l1": 0.920349434737924,
299
+ "eval_precision-l2": 0.9494535519125683,
300
+ "eval_recall": 0.9406976744186046,
301
+ "eval_recall-all": 0.9339401056958309,
302
+ "eval_recall-das": 0.9400372439478585,
303
+ "eval_recall-l1": 0.9401574803149606,
304
+ "eval_recall-l2": 0.9260493004663558,
305
+ "eval_runtime": 6.5502,
306
+ "eval_samples_per_second": 103.203,
307
+ "eval_steps_per_second": 6.565,
308
+ "step": 300
309
+ },
310
+ {
311
+ "epoch": 1.05,
312
+ "eval_ACT": {
313
+ "f1": 0.9244019138755981,
314
+ "number": 519,
315
+ "precision": 0.9182509505703422,
316
+ "recall": 0.930635838150289
317
+ },
318
+ "eval_ACT_L1": {
319
+ "f1": 0.9448818897637794,
320
+ "number": 503,
321
+ "precision": 0.935672514619883,
322
+ "recall": 0.9542743538767395
323
+ },
324
+ "eval_ACT_L2": {
325
+ "f1": 0.20689655172413793,
326
+ "number": 16,
327
+ "precision": 0.23076923076923078,
328
+ "recall": 0.1875
329
+ },
330
+ "eval_CARDINAL": {
331
+ "f1": 0.9874723655121592,
332
+ "number": 678,
333
+ "precision": 0.9867452135493373,
334
+ "recall": 0.9882005899705014
335
+ },
336
+ "eval_DESC": {
337
+ "f1": 0.28235294117647064,
338
+ "number": 30,
339
+ "precision": 0.21818181818181817,
340
+ "recall": 0.4
341
+ },
342
+ "eval_FT": {
343
+ "f1": 0.0,
344
+ "number": 7,
345
+ "precision": 0.0,
346
+ "recall": 0.0
347
+ },
348
+ "eval_LOC": {
349
+ "f1": 0.9488859764089123,
350
+ "number": 761,
351
+ "precision": 0.9464052287581699,
352
+ "recall": 0.9513797634691196
353
+ },
354
+ "eval_PER": {
355
+ "f1": 0.951683748169839,
356
+ "number": 676,
357
+ "precision": 0.9420289855072463,
358
+ "recall": 0.9615384615384616
359
+ },
360
+ "eval_SPAT": {
361
+ "f1": 0.9491768074445239,
362
+ "number": 694,
363
+ "precision": 0.9431009957325747,
364
+ "recall": 0.9553314121037464
365
+ },
366
+ "eval_TITRE": {
367
+ "f1": 0.0,
368
+ "number": 2,
369
+ "precision": 0.0,
370
+ "recall": 0.0
371
+ },
372
+ "eval_TITREH": {
373
+ "f1": 0.5263157894736842,
374
+ "number": 33,
375
+ "precision": 0.625,
376
+ "recall": 0.45454545454545453
377
+ },
378
+ "eval_TITREP": {
379
+ "f1": 0.0,
380
+ "number": 6,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_accuracy": 0.9395089850670716,
385
+ "eval_accuracy-all": 0.9572892938496583,
386
+ "eval_accuracy-das": 0.9578587699316629,
387
+ "eval_accuracy-l1": 0.9484940521386991,
388
+ "eval_accuracy-l2": 0.9660845355606176,
389
+ "eval_f1": 0.9442109839153746,
390
+ "eval_f1-all": 0.9395443925233645,
391
+ "eval_f1-das": 0.9498415066194295,
392
+ "eval_f1-l1": 0.933781686497672,
393
+ "eval_f1-l2": 0.9470154258886653,
394
+ "eval_loss": 0.19686226546764374,
395
+ "eval_precision": 0.9413464316671483,
396
+ "eval_precision-all": 0.9346310284718187,
397
+ "eval_precision-das": 0.9510828976848394,
398
+ "eval_precision-l1": 0.9204487506374299,
399
+ "eval_precision-l2": 0.9534098582039163,
400
+ "eval_recall": 0.9470930232558139,
401
+ "eval_recall-all": 0.9445096887844979,
402
+ "eval_recall-das": 0.9486033519553073,
403
+ "eval_recall-l1": 0.94750656167979,
404
+ "eval_recall-l2": 0.9407061958694204,
405
+ "eval_runtime": 6.1906,
406
+ "eval_samples_per_second": 109.198,
407
+ "eval_steps_per_second": 6.946,
408
+ "step": 400
409
+ },
410
+ {
411
+ "epoch": 1.31,
412
+ "learning_rate": 9e-05,
413
+ "loss": 0.3718,
414
+ "step": 500
415
+ },
416
+ {
417
+ "epoch": 1.31,
418
+ "eval_ACT": {
419
+ "f1": 0.9380362249761677,
420
+ "number": 519,
421
+ "precision": 0.9283018867924528,
422
+ "recall": 0.9479768786127167
423
+ },
424
+ "eval_ACT_L1": {
425
+ "f1": 0.952565343659245,
426
+ "number": 503,
427
+ "precision": 0.9283018867924528,
428
+ "recall": 0.9781312127236581
429
+ },
430
+ "eval_ACT_L2": {
431
+ "f1": 0.0,
432
+ "number": 16,
433
+ "precision": 0.0,
434
+ "recall": 0.0
435
+ },
436
+ "eval_CARDINAL": {
437
+ "f1": 0.986019131714496,
438
+ "number": 678,
439
+ "precision": 0.9838472834067548,
440
+ "recall": 0.9882005899705014
441
+ },
442
+ "eval_DESC": {
443
+ "f1": 0.23809523809523808,
444
+ "number": 30,
445
+ "precision": 0.4166666666666667,
446
+ "recall": 0.16666666666666666
447
+ },
448
+ "eval_FT": {
449
+ "f1": 0.0,
450
+ "number": 7,
451
+ "precision": 0.0,
452
+ "recall": 0.0
453
+ },
454
+ "eval_LOC": {
455
+ "f1": 0.945645055664702,
456
+ "number": 761,
457
+ "precision": 0.9425587467362925,
458
+ "recall": 0.9487516425755584
459
+ },
460
+ "eval_PER": {
461
+ "f1": 0.9683124539425203,
462
+ "number": 676,
463
+ "precision": 0.9647577092511013,
464
+ "recall": 0.9718934911242604
465
+ },
466
+ "eval_SPAT": {
467
+ "f1": 0.9472182596291013,
468
+ "number": 694,
469
+ "precision": 0.9378531073446328,
470
+ "recall": 0.9567723342939481
471
+ },
472
+ "eval_TITRE": {
473
+ "f1": 0.0,
474
+ "number": 2,
475
+ "precision": 0.0,
476
+ "recall": 0.0
477
+ },
478
+ "eval_TITREH": {
479
+ "f1": 0.8181818181818182,
480
+ "number": 33,
481
+ "precision": 0.8181818181818182,
482
+ "recall": 0.8181818181818182
483
+ },
484
+ "eval_TITREP": {
485
+ "f1": 0.25,
486
+ "number": 6,
487
+ "precision": 0.5,
488
+ "recall": 0.16666666666666666
489
+ },
490
+ "eval_accuracy": 0.9534295115160719,
491
+ "eval_accuracy-all": 0.9654517843583903,
492
+ "eval_accuracy-das": 0.9665907365223994,
493
+ "eval_accuracy-l1": 0.958744621614781,
494
+ "eval_accuracy-l2": 0.9721589471019995,
495
+ "eval_f1": 0.9550021843599825,
496
+ "eval_f1-all": 0.9496993694090042,
497
+ "eval_f1-das": 0.9570552147239264,
498
+ "eval_f1-l1": 0.9478623566214807,
499
+ "eval_f1-l2": 0.9520616828695944,
500
+ "eval_loss": 0.18782156705856323,
501
+ "eval_precision": 0.9568135395389553,
502
+ "eval_precision-all": 0.9487254614708468,
503
+ "eval_precision-das": 0.955456570155902,
504
+ "eval_precision-l1": 0.9414810978767478,
505
+ "eval_precision-l2": 0.9581646423751687,
506
+ "eval_recall": 0.9531976744186047,
507
+ "eval_recall-all": 0.9506752789195537,
508
+ "eval_recall-das": 0.958659217877095,
509
+ "eval_recall-l1": 0.9543307086614173,
510
+ "eval_recall-l2": 0.9460359760159893,
511
+ "eval_runtime": 6.174,
512
+ "eval_samples_per_second": 109.491,
513
+ "eval_steps_per_second": 6.965,
514
+ "step": 500
515
+ },
516
+ {
517
+ "epoch": 1.57,
518
+ "eval_ACT": {
519
+ "f1": 0.9334600760456274,
520
+ "number": 519,
521
+ "precision": 0.9212007504690432,
522
+ "recall": 0.9460500963391136
523
+ },
524
+ "eval_ACT_L1": {
525
+ "f1": 0.9468599033816425,
526
+ "number": 503,
527
+ "precision": 0.9210526315789473,
528
+ "recall": 0.974155069582505
529
+ },
530
+ "eval_ACT_L2": {
531
+ "f1": 0.11764705882352941,
532
+ "number": 16,
533
+ "precision": 1.0,
534
+ "recall": 0.0625
535
+ },
536
+ "eval_CARDINAL": {
537
+ "f1": 0.9867452135493373,
538
+ "number": 678,
539
+ "precision": 0.9852941176470589,
540
+ "recall": 0.9882005899705014
541
+ },
542
+ "eval_DESC": {
543
+ "f1": 0.3333333333333333,
544
+ "number": 30,
545
+ "precision": 0.3333333333333333,
546
+ "recall": 0.3333333333333333
547
+ },
548
+ "eval_FT": {
549
+ "f1": 0.0,
550
+ "number": 7,
551
+ "precision": 0.0,
552
+ "recall": 0.0
553
+ },
554
+ "eval_LOC": {
555
+ "f1": 0.9490403706154864,
556
+ "number": 761,
557
+ "precision": 0.956,
558
+ "recall": 0.9421813403416557
559
+ },
560
+ "eval_PER": {
561
+ "f1": 0.9572271386430679,
562
+ "number": 676,
563
+ "precision": 0.9544117647058824,
564
+ "recall": 0.9600591715976331
565
+ },
566
+ "eval_SPAT": {
567
+ "f1": 0.9538904899135446,
568
+ "number": 694,
569
+ "precision": 0.9538904899135446,
570
+ "recall": 0.9538904899135446
571
+ },
572
+ "eval_TITRE": {
573
+ "f1": 0.0,
574
+ "number": 2,
575
+ "precision": 0.0,
576
+ "recall": 0.0
577
+ },
578
+ "eval_TITREH": {
579
+ "f1": 0.6153846153846154,
580
+ "number": 33,
581
+ "precision": 0.625,
582
+ "recall": 0.6060606060606061
583
+ },
584
+ "eval_TITREP": {
585
+ "f1": 0.4444444444444444,
586
+ "number": 6,
587
+ "precision": 0.6666666666666666,
588
+ "recall": 0.3333333333333333
589
+ },
590
+ "eval_accuracy": 0.9544419134396356,
591
+ "eval_accuracy-all": 0.9670969374841812,
592
+ "eval_accuracy-das": 0.9669703872437357,
593
+ "eval_accuracy-l1": 0.960642875221463,
594
+ "eval_accuracy-l2": 0.9735509997468995,
595
+ "eval_f1": 0.9518265172463979,
596
+ "eval_f1-all": 0.9462397179788484,
597
+ "eval_f1-das": 0.952807312068644,
598
+ "eval_f1-l1": 0.9429835980213485,
599
+ "eval_f1-l2": 0.9504550050556118,
600
+ "eval_loss": 0.1709740161895752,
601
+ "eval_precision": 0.9530749052754299,
602
+ "eval_precision-all": 0.9467960023515579,
603
+ "eval_precision-das": 0.9544095665171899,
604
+ "eval_precision-l1": 0.9354338842975206,
605
+ "eval_precision-l2": 0.9618008185538881,
606
+ "eval_recall": 0.9505813953488372,
607
+ "eval_recall-all": 0.9456840869054609,
608
+ "eval_recall-das": 0.9512104283054004,
609
+ "eval_recall-l1": 0.9506561679790027,
610
+ "eval_recall-l2": 0.9393737508327782,
611
+ "eval_runtime": 6.1402,
612
+ "eval_samples_per_second": 110.094,
613
+ "eval_steps_per_second": 7.003,
614
+ "step": 600
615
+ },
616
+ {
617
+ "epoch": 1.84,
618
+ "eval_ACT": {
619
+ "f1": 0.9339712918660287,
620
+ "number": 519,
621
+ "precision": 0.9277566539923955,
622
+ "recall": 0.9402697495183044
623
+ },
624
+ "eval_ACT_L1": {
625
+ "f1": 0.9536031589338598,
626
+ "number": 503,
627
+ "precision": 0.9470588235294117,
628
+ "recall": 0.9602385685884692
629
+ },
630
+ "eval_ACT_L2": {
631
+ "f1": 0.3125,
632
+ "number": 16,
633
+ "precision": 0.3125,
634
+ "recall": 0.3125
635
+ },
636
+ "eval_CARDINAL": {
637
+ "f1": 0.9867647058823529,
638
+ "number": 678,
639
+ "precision": 0.9838709677419355,
640
+ "recall": 0.9896755162241888
641
+ },
642
+ "eval_DESC": {
643
+ "f1": 0.5,
644
+ "number": 30,
645
+ "precision": 0.47058823529411764,
646
+ "recall": 0.5333333333333333
647
+ },
648
+ "eval_FT": {
649
+ "f1": 0.0,
650
+ "number": 7,
651
+ "precision": 0.0,
652
+ "recall": 0.0
653
+ },
654
+ "eval_LOC": {
655
+ "f1": 0.9457161543492479,
656
+ "number": 761,
657
+ "precision": 0.94140625,
658
+ "recall": 0.9500657030223391
659
+ },
660
+ "eval_PER": {
661
+ "f1": 0.9711324944485566,
662
+ "number": 676,
663
+ "precision": 0.9718518518518519,
664
+ "recall": 0.9704142011834319
665
+ },
666
+ "eval_SPAT": {
667
+ "f1": 0.9611510791366907,
668
+ "number": 694,
669
+ "precision": 0.9597701149425287,
670
+ "recall": 0.962536023054755
671
+ },
672
+ "eval_TITRE": {
673
+ "f1": 0.0,
674
+ "number": 2,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_TITREH": {
679
+ "f1": 0.9032258064516129,
680
+ "number": 33,
681
+ "precision": 0.9655172413793104,
682
+ "recall": 0.8484848484848485
683
+ },
684
+ "eval_TITREP": {
685
+ "f1": 0.2857142857142857,
686
+ "number": 6,
687
+ "precision": 1.0,
688
+ "recall": 0.16666666666666666
689
+ },
690
+ "eval_accuracy": 0.95292331055429,
691
+ "eval_accuracy-all": 0.9641862819539357,
692
+ "eval_accuracy-das": 0.9721589471019995,
693
+ "eval_accuracy-l1": 0.9586180713743356,
694
+ "eval_accuracy-l2": 0.9697544925335359,
695
+ "eval_f1": 0.9564586357039186,
696
+ "eval_f1-all": 0.9537919906117059,
697
+ "eval_f1-das": 0.9595827900912646,
698
+ "eval_f1-l1": 0.9544502617801047,
699
+ "eval_f1-l2": 0.9529529529529529,
700
+ "eval_loss": 0.16730760037899017,
701
+ "eval_precision": 0.9550724637681159,
702
+ "eval_precision-all": 0.9530929346232776,
703
+ "eval_precision-das": 0.9597615499254843,
704
+ "eval_precision-l1": 0.951958224543081,
705
+ "eval_precision-l2": 0.9545454545454546,
706
+ "eval_recall": 0.9578488372093024,
707
+ "eval_recall-all": 0.9544920728126834,
708
+ "eval_recall-das": 0.9594040968342644,
709
+ "eval_recall-l1": 0.9569553805774278,
710
+ "eval_recall-l2": 0.9513657561625583,
711
+ "eval_runtime": 6.0205,
712
+ "eval_samples_per_second": 112.283,
713
+ "eval_steps_per_second": 7.142,
714
+ "step": 700
715
+ },
716
+ {
717
+ "epoch": 2.1,
718
+ "eval_ACT": {
719
+ "f1": 0.9249762583095916,
720
+ "number": 519,
721
+ "precision": 0.9119850187265918,
722
+ "recall": 0.9383429672447013
723
+ },
724
+ "eval_ACT_L1": {
725
+ "f1": 0.9545454545454545,
726
+ "number": 503,
727
+ "precision": 0.9489194499017681,
728
+ "recall": 0.9602385685884692
729
+ },
730
+ "eval_ACT_L2": {
731
+ "f1": 0.19512195121951217,
732
+ "number": 16,
733
+ "precision": 0.16,
734
+ "recall": 0.25
735
+ },
736
+ "eval_CARDINAL": {
737
+ "f1": 0.9851851851851852,
738
+ "number": 678,
739
+ "precision": 0.9895833333333334,
740
+ "recall": 0.9808259587020649
741
+ },
742
+ "eval_DESC": {
743
+ "f1": 0.4347826086956522,
744
+ "number": 30,
745
+ "precision": 0.38461538461538464,
746
+ "recall": 0.5
747
+ },
748
+ "eval_FT": {
749
+ "f1": 0.0,
750
+ "number": 7,
751
+ "precision": 0.0,
752
+ "recall": 0.0
753
+ },
754
+ "eval_LOC": {
755
+ "f1": 0.9516971279373369,
756
+ "number": 761,
757
+ "precision": 0.9455252918287937,
758
+ "recall": 0.9579500657030223
759
+ },
760
+ "eval_PER": {
761
+ "f1": 0.9748892171344165,
762
+ "number": 676,
763
+ "precision": 0.9734513274336283,
764
+ "recall": 0.9763313609467456
765
+ },
766
+ "eval_SPAT": {
767
+ "f1": 0.9342857142857142,
768
+ "number": 694,
769
+ "precision": 0.9263456090651558,
770
+ "recall": 0.9423631123919308
771
+ },
772
+ "eval_TITRE": {
773
+ "f1": 0.0,
774
+ "number": 2,
775
+ "precision": 0.0,
776
+ "recall": 0.0
777
+ },
778
+ "eval_TITREH": {
779
+ "f1": 0.8656716417910447,
780
+ "number": 33,
781
+ "precision": 0.8529411764705882,
782
+ "recall": 0.8787878787878788
783
+ },
784
+ "eval_TITREP": {
785
+ "f1": 0.5,
786
+ "number": 6,
787
+ "precision": 1.0,
788
+ "recall": 0.3333333333333333
789
+ },
790
+ "eval_accuracy": 0.9510250569476082,
791
+ "eval_accuracy-all": 0.9619083776259175,
792
+ "eval_accuracy-das": 0.9702606934953176,
793
+ "eval_accuracy-l1": 0.9567198177676538,
794
+ "eval_accuracy-l2": 0.9670969374841812,
795
+ "eval_f1": 0.955323469683783,
796
+ "eval_f1-all": 0.9473838059047063,
797
+ "eval_f1-das": 0.9587053571428571,
798
+ "eval_f1-l1": 0.9444878811571541,
799
+ "eval_f1-l2": 0.95108153078203,
800
+ "eval_loss": 0.1715497374534607,
801
+ "eval_precision": 0.9533873769542559,
802
+ "eval_precision-all": 0.9432479627473807,
803
+ "eval_precision-das": 0.9576365663322185,
804
+ "eval_precision-l1": 0.937888198757764,
805
+ "eval_precision-l2": 0.9501329787234043,
806
+ "eval_recall": 0.9572674418604651,
807
+ "eval_recall-all": 0.9515560775102759,
808
+ "eval_recall-das": 0.9597765363128492,
809
+ "eval_recall-l1": 0.9511811023622048,
810
+ "eval_recall-l2": 0.9520319786808794,
811
+ "eval_runtime": 6.0149,
812
+ "eval_samples_per_second": 112.387,
813
+ "eval_steps_per_second": 7.149,
814
+ "step": 800
815
+ },
816
+ {
817
+ "epoch": 2.36,
818
+ "eval_ACT": {
819
+ "f1": 0.9271523178807947,
820
+ "number": 519,
821
+ "precision": 0.9107806691449815,
822
+ "recall": 0.9441233140655106
823
+ },
824
+ "eval_ACT_L1": {
825
+ "f1": 0.9500489715964741,
826
+ "number": 503,
827
+ "precision": 0.9362934362934363,
828
+ "recall": 0.9642147117296223
829
+ },
830
+ "eval_ACT_L2": {
831
+ "f1": 0.2777777777777778,
832
+ "number": 16,
833
+ "precision": 0.25,
834
+ "recall": 0.3125
835
+ },
836
+ "eval_CARDINAL": {
837
+ "f1": 0.9816581071166545,
838
+ "number": 678,
839
+ "precision": 0.9766423357664233,
840
+ "recall": 0.9867256637168141
841
+ },
842
+ "eval_DESC": {
843
+ "f1": 0.39473684210526316,
844
+ "number": 30,
845
+ "precision": 0.32608695652173914,
846
+ "recall": 0.5
847
+ },
848
+ "eval_FT": {
849
+ "f1": 0.0,
850
+ "number": 7,
851
+ "precision": 0.0,
852
+ "recall": 0.0
853
+ },
854
+ "eval_LOC": {
855
+ "f1": 0.9455022980958635,
856
+ "number": 761,
857
+ "precision": 0.9448818897637795,
858
+ "recall": 0.9461235216819974
859
+ },
860
+ "eval_PER": {
861
+ "f1": 0.9763663220088628,
862
+ "number": 676,
863
+ "precision": 0.9749262536873157,
864
+ "recall": 0.977810650887574
865
+ },
866
+ "eval_SPAT": {
867
+ "f1": 0.9526542324246772,
868
+ "number": 694,
869
+ "precision": 0.9485714285714286,
870
+ "recall": 0.9567723342939481
871
+ },
872
+ "eval_TITRE": {
873
+ "f1": 0.0,
874
+ "number": 2,
875
+ "precision": 0.0,
876
+ "recall": 0.0
877
+ },
878
+ "eval_TITREH": {
879
+ "f1": 0.823529411764706,
880
+ "number": 33,
881
+ "precision": 0.8,
882
+ "recall": 0.8484848484848485
883
+ },
884
+ "eval_TITREP": {
885
+ "f1": 0.3333333333333333,
886
+ "number": 6,
887
+ "precision": 0.3333333333333333,
888
+ "recall": 0.3333333333333333
889
+ },
890
+ "eval_accuracy": 0.9524171095925082,
891
+ "eval_accuracy-all": 0.9633637053910402,
892
+ "eval_accuracy-das": 0.9712730954188813,
893
+ "eval_accuracy-l1": 0.9593773728170083,
894
+ "eval_accuracy-l2": 0.9673500379650721,
895
+ "eval_f1": 0.9529599073672022,
896
+ "eval_f1-all": 0.9477829638273045,
897
+ "eval_f1-das": 0.9574902543159458,
898
+ "eval_f1-l1": 0.9487912659214973,
899
+ "eval_f1-l2": 0.9464938517779994,
900
+ "eval_loss": 0.15614591538906097,
901
+ "eval_precision": 0.9489766503315077,
902
+ "eval_precision-all": 0.9417391304347826,
903
+ "eval_precision-das": 0.9544781643227239,
904
+ "eval_precision-l1": 0.9397528321318228,
905
+ "eval_precision-l2": 0.9442970822281167,
906
+ "eval_recall": 0.9569767441860465,
907
+ "eval_recall-all": 0.953904873752202,
908
+ "eval_recall-das": 0.9605214152700187,
909
+ "eval_recall-l1": 0.958005249343832,
910
+ "eval_recall-l2": 0.9487008660892738,
911
+ "eval_runtime": 6.5502,
912
+ "eval_samples_per_second": 103.202,
913
+ "eval_steps_per_second": 6.565,
914
+ "step": 900
915
+ },
916
+ {
917
+ "epoch": 2.62,
918
+ "learning_rate": 8e-05,
919
+ "loss": 0.1448,
920
+ "step": 1000
921
+ },
922
+ {
923
+ "epoch": 2.62,
924
+ "eval_ACT": {
925
+ "f1": 0.9319470699432891,
926
+ "number": 519,
927
+ "precision": 0.9146567717996289,
928
+ "recall": 0.9499036608863198
929
+ },
930
+ "eval_ACT_L1": {
931
+ "f1": 0.9547244094488189,
932
+ "number": 503,
933
+ "precision": 0.9454191033138402,
934
+ "recall": 0.9642147117296223
935
+ },
936
+ "eval_ACT_L2": {
937
+ "f1": 0.380952380952381,
938
+ "number": 16,
939
+ "precision": 0.3076923076923077,
940
+ "recall": 0.5
941
+ },
942
+ "eval_CARDINAL": {
943
+ "f1": 0.9852941176470589,
944
+ "number": 678,
945
+ "precision": 0.9824046920821115,
946
+ "recall": 0.9882005899705014
947
+ },
948
+ "eval_DESC": {
949
+ "f1": 0.45569620253164556,
950
+ "number": 30,
951
+ "precision": 0.3673469387755102,
952
+ "recall": 0.6
953
+ },
954
+ "eval_FT": {
955
+ "f1": 0.0,
956
+ "number": 7,
957
+ "precision": 0.0,
958
+ "recall": 0.0
959
+ },
960
+ "eval_LOC": {
961
+ "f1": 0.9586342744583061,
962
+ "number": 761,
963
+ "precision": 0.958005249343832,
964
+ "recall": 0.9592641261498029
965
+ },
966
+ "eval_PER": {
967
+ "f1": 0.9719350073855243,
968
+ "number": 676,
969
+ "precision": 0.9705014749262537,
970
+ "recall": 0.9733727810650887
971
+ },
972
+ "eval_SPAT": {
973
+ "f1": 0.9469914040114613,
974
+ "number": 694,
975
+ "precision": 0.9415954415954416,
976
+ "recall": 0.952449567723343
977
+ },
978
+ "eval_TITRE": {
979
+ "f1": 0.0,
980
+ "number": 2,
981
+ "precision": 0.0,
982
+ "recall": 0.0
983
+ },
984
+ "eval_TITREH": {
985
+ "f1": 0.7692307692307692,
986
+ "number": 33,
987
+ "precision": 0.78125,
988
+ "recall": 0.7575757575757576
989
+ },
990
+ "eval_TITREP": {
991
+ "f1": 0.4444444444444444,
992
+ "number": 6,
993
+ "precision": 0.6666666666666666,
994
+ "recall": 0.3333333333333333
995
+ },
996
+ "eval_accuracy": 0.9536826119969628,
997
+ "eval_accuracy-all": 0.9634902556314857,
998
+ "eval_accuracy-das": 0.9735509997468995,
999
+ "eval_accuracy-l1": 0.9593773728170083,
1000
+ "eval_accuracy-l2": 0.967603138445963,
1001
+ "eval_f1": 0.958689665168865,
1002
+ "eval_f1-all": 0.9505326134539618,
1003
+ "eval_f1-das": 0.9622466059140785,
1004
+ "eval_f1-l1": 0.9472316090460099,
1005
+ "eval_f1-l2": 0.9547571523619428,
1006
+ "eval_loss": 0.16222244501113892,
1007
+ "eval_precision": 0.9560566637756577,
1008
+ "eval_precision-all": 0.944879605454018,
1009
+ "eval_precision-das": 0.9609955423476969,
1010
+ "eval_precision-l1": 0.9382080329557158,
1011
+ "eval_precision-l2": 0.9534883720930233,
1012
+ "eval_recall": 0.9613372093023256,
1013
+ "eval_recall-all": 0.956253669994128,
1014
+ "eval_recall-das": 0.9635009310986965,
1015
+ "eval_recall-l1": 0.9564304461942257,
1016
+ "eval_recall-l2": 0.9560293137908061,
1017
+ "eval_runtime": 5.8166,
1018
+ "eval_samples_per_second": 116.219,
1019
+ "eval_steps_per_second": 7.393,
1020
+ "step": 1000
1021
+ },
1022
+ {
1023
+ "epoch": 2.89,
1024
+ "eval_ACT": {
1025
+ "f1": 0.9426386233269598,
1026
+ "number": 519,
1027
+ "precision": 0.9354838709677419,
1028
+ "recall": 0.9499036608863198
1029
+ },
1030
+ "eval_ACT_L1": {
1031
+ "f1": 0.9614243323442137,
1032
+ "number": 503,
1033
+ "precision": 0.9566929133858267,
1034
+ "recall": 0.9662027833001988
1035
+ },
1036
+ "eval_ACT_L2": {
1037
+ "f1": 0.39999999999999997,
1038
+ "number": 16,
1039
+ "precision": 0.3684210526315789,
1040
+ "recall": 0.4375
1041
+ },
1042
+ "eval_CARDINAL": {
1043
+ "f1": 0.9882179675994109,
1044
+ "number": 678,
1045
+ "precision": 0.986764705882353,
1046
+ "recall": 0.9896755162241888
1047
+ },
1048
+ "eval_DESC": {
1049
+ "f1": 0.5217391304347826,
1050
+ "number": 30,
1051
+ "precision": 0.46153846153846156,
1052
+ "recall": 0.6
1053
+ },
1054
+ "eval_FT": {
1055
+ "f1": 0.0,
1056
+ "number": 7,
1057
+ "precision": 0.0,
1058
+ "recall": 0.0
1059
+ },
1060
+ "eval_LOC": {
1061
+ "f1": 0.9420949902407288,
1062
+ "number": 761,
1063
+ "precision": 0.9329896907216495,
1064
+ "recall": 0.9513797634691196
1065
+ },
1066
+ "eval_PER": {
1067
+ "f1": 0.9770879526977089,
1068
+ "number": 676,
1069
+ "precision": 0.9763663220088626,
1070
+ "recall": 0.977810650887574
1071
+ },
1072
+ "eval_SPAT": {
1073
+ "f1": 0.9577060931899642,
1074
+ "number": 694,
1075
+ "precision": 0.9529243937232525,
1076
+ "recall": 0.962536023054755
1077
+ },
1078
+ "eval_TITRE": {
1079
+ "f1": 0.0,
1080
+ "number": 2,
1081
+ "precision": 0.0,
1082
+ "recall": 0.0
1083
+ },
1084
+ "eval_TITREH": {
1085
+ "f1": 0.8,
1086
+ "number": 33,
1087
+ "precision": 0.8125,
1088
+ "recall": 0.7878787878787878
1089
+ },
1090
+ "eval_TITREP": {
1091
+ "f1": 0.4,
1092
+ "number": 6,
1093
+ "precision": 0.3333333333333333,
1094
+ "recall": 0.5
1095
+ },
1096
+ "eval_accuracy": 0.9539357124778537,
1097
+ "eval_accuracy-all": 0.9638699063528221,
1098
+ "eval_accuracy-das": 0.9727916983042267,
1099
+ "eval_accuracy-l1": 0.9610225259427992,
1100
+ "eval_accuracy-l2": 0.9667172867628449,
1101
+ "eval_f1": 0.9571883135666762,
1102
+ "eval_f1-all": 0.9534102526654009,
1103
+ "eval_f1-das": 0.9606533036377134,
1104
+ "eval_f1-l1": 0.9571801566579634,
1105
+ "eval_f1-l2": 0.9486244613854822,
1106
+ "eval_loss": 0.17501647770404816,
1107
+ "eval_precision": 0.9525043177892919,
1108
+ "eval_precision-all": 0.948561464690497,
1109
+ "eval_precision-das": 0.9574546799852016,
1110
+ "eval_precision-l1": 0.9522077922077922,
1111
+ "eval_precision-l2": 0.9439313984168866,
1112
+ "eval_recall": 0.9619186046511627,
1113
+ "eval_recall-all": 0.9583088667058133,
1114
+ "eval_recall-das": 0.9638733705772812,
1115
+ "eval_recall-l1": 0.9622047244094488,
1116
+ "eval_recall-l2": 0.9533644237175216,
1117
+ "eval_runtime": 6.2615,
1118
+ "eval_samples_per_second": 107.961,
1119
+ "eval_steps_per_second": 6.867,
1120
+ "step": 1100
1121
+ },
1122
+ {
1123
+ "epoch": 3.15,
1124
+ "eval_ACT": {
1125
+ "f1": 0.9417382999044891,
1126
+ "number": 519,
1127
+ "precision": 0.9337121212121212,
1128
+ "recall": 0.9499036608863198
1129
+ },
1130
+ "eval_ACT_L1": {
1131
+ "f1": 0.9594460929772503,
1132
+ "number": 503,
1133
+ "precision": 0.9547244094488189,
1134
+ "recall": 0.9642147117296223
1135
+ },
1136
+ "eval_ACT_L2": {
1137
+ "f1": 0.4444444444444445,
1138
+ "number": 16,
1139
+ "precision": 0.4,
1140
+ "recall": 0.5
1141
+ },
1142
+ "eval_CARDINAL": {
1143
+ "f1": 0.9867647058823529,
1144
+ "number": 678,
1145
+ "precision": 0.9838709677419355,
1146
+ "recall": 0.9896755162241888
1147
+ },
1148
+ "eval_DESC": {
1149
+ "f1": 0.45454545454545453,
1150
+ "number": 30,
1151
+ "precision": 0.4166666666666667,
1152
+ "recall": 0.5
1153
+ },
1154
+ "eval_FT": {
1155
+ "f1": 0.0,
1156
+ "number": 7,
1157
+ "precision": 0.0,
1158
+ "recall": 0.0
1159
+ },
1160
+ "eval_LOC": {
1161
+ "f1": 0.9510763209393347,
1162
+ "number": 761,
1163
+ "precision": 0.944300518134715,
1164
+ "recall": 0.9579500657030223
1165
+ },
1166
+ "eval_PER": {
1167
+ "f1": 0.9785661492978566,
1168
+ "number": 676,
1169
+ "precision": 0.9778434268833087,
1170
+ "recall": 0.9792899408284024
1171
+ },
1172
+ "eval_SPAT": {
1173
+ "f1": 0.9562096195262024,
1174
+ "number": 694,
1175
+ "precision": 0.9527896995708155,
1176
+ "recall": 0.9596541786743515
1177
+ },
1178
+ "eval_TITRE": {
1179
+ "f1": 0.0,
1180
+ "number": 2,
1181
+ "precision": 0.0,
1182
+ "recall": 0.0
1183
+ },
1184
+ "eval_TITREH": {
1185
+ "f1": 0.8055555555555556,
1186
+ "number": 33,
1187
+ "precision": 0.7435897435897436,
1188
+ "recall": 0.8787878787878788
1189
+ },
1190
+ "eval_TITREP": {
1191
+ "f1": 0.5454545454545454,
1192
+ "number": 6,
1193
+ "precision": 0.6,
1194
+ "recall": 0.5
1195
+ },
1196
+ "eval_accuracy": 0.9538091622374083,
1197
+ "eval_accuracy-all": 0.9638066312325994,
1198
+ "eval_accuracy-das": 0.9724120475828905,
1199
+ "eval_accuracy-l1": 0.9598835737787902,
1200
+ "eval_accuracy-l2": 0.9677296886864085,
1201
+ "eval_f1": 0.9574775817182528,
1202
+ "eval_f1-all": 0.9549970777323202,
1203
+ "eval_f1-das": 0.9612172944887734,
1204
+ "eval_f1-l1": 0.9558169934640522,
1205
+ "eval_f1-l2": 0.9539582643259357,
1206
+ "eval_loss": 0.17843317985534668,
1207
+ "eval_precision": 0.9527921704087507,
1208
+ "eval_precision-all": 0.9505526468877254,
1209
+ "eval_precision-das": 0.9578402366863905,
1210
+ "eval_precision-l1": 0.9520833333333333,
1211
+ "eval_precision-l2": 0.9486166007905138,
1212
+ "eval_recall": 0.9622093023255814,
1213
+ "eval_recall-all": 0.9594832648267763,
1214
+ "eval_recall-das": 0.9646182495344506,
1215
+ "eval_recall-l1": 0.9595800524934384,
1216
+ "eval_recall-l2": 0.9593604263824117,
1217
+ "eval_runtime": 6.7294,
1218
+ "eval_samples_per_second": 100.455,
1219
+ "eval_steps_per_second": 6.39,
1220
+ "step": 1200
1221
+ },
1222
+ {
1223
+ "epoch": 3.41,
1224
+ "eval_ACT": {
1225
+ "f1": 0.939047619047619,
1226
+ "number": 519,
1227
+ "precision": 0.928436911487759,
1228
+ "recall": 0.9499036608863198
1229
+ },
1230
+ "eval_ACT_L1": {
1231
+ "f1": 0.9576354679802955,
1232
+ "number": 503,
1233
+ "precision": 0.94921875,
1234
+ "recall": 0.9662027833001988
1235
+ },
1236
+ "eval_ACT_L2": {
1237
+ "f1": 0.39999999999999997,
1238
+ "number": 16,
1239
+ "precision": 0.3684210526315789,
1240
+ "recall": 0.4375
1241
+ },
1242
+ "eval_CARDINAL": {
1243
+ "f1": 0.9852724594992636,
1244
+ "number": 678,
1245
+ "precision": 0.9838235294117647,
1246
+ "recall": 0.9867256637168141
1247
+ },
1248
+ "eval_DESC": {
1249
+ "f1": 0.5161290322580646,
1250
+ "number": 30,
1251
+ "precision": 0.5,
1252
+ "recall": 0.5333333333333333
1253
+ },
1254
+ "eval_FT": {
1255
+ "f1": 0.4444444444444445,
1256
+ "number": 7,
1257
+ "precision": 1.0,
1258
+ "recall": 0.2857142857142857
1259
+ },
1260
+ "eval_LOC": {
1261
+ "f1": 0.9546946815495732,
1262
+ "number": 761,
1263
+ "precision": 0.9540682414698163,
1264
+ "recall": 0.9553219448094612
1265
+ },
1266
+ "eval_PER": {
1267
+ "f1": 0.9785661492978566,
1268
+ "number": 676,
1269
+ "precision": 0.9778434268833087,
1270
+ "recall": 0.9792899408284024
1271
+ },
1272
+ "eval_SPAT": {
1273
+ "f1": 0.9569583931133429,
1274
+ "number": 694,
1275
+ "precision": 0.9528571428571428,
1276
+ "recall": 0.9610951008645533
1277
+ },
1278
+ "eval_TITRE": {
1279
+ "f1": 0.0,
1280
+ "number": 2,
1281
+ "precision": 0.0,
1282
+ "recall": 0.0
1283
+ },
1284
+ "eval_TITREH": {
1285
+ "f1": 0.7096774193548386,
1286
+ "number": 33,
1287
+ "precision": 0.7586206896551724,
1288
+ "recall": 0.6666666666666666
1289
+ },
1290
+ "eval_TITREP": {
1291
+ "f1": 0.5,
1292
+ "number": 6,
1293
+ "precision": 0.5,
1294
+ "recall": 0.5
1295
+ },
1296
+ "eval_accuracy": 0.960642875221463,
1297
+ "eval_accuracy-all": 0.9691217413313086,
1298
+ "eval_accuracy-das": 0.9778537079220451,
1299
+ "eval_accuracy-l1": 0.9653252341179448,
1300
+ "eval_accuracy-l2": 0.9729182485446722,
1301
+ "eval_f1": 0.9602562236133353,
1302
+ "eval_f1-all": 0.9556043956043958,
1303
+ "eval_f1-das": 0.9622044312046174,
1304
+ "eval_f1-l1": 0.9571353894406691,
1305
+ "eval_f1-l2": 0.9536512170723576,
1306
+ "eval_loss": 0.16250379383563995,
1307
+ "eval_precision": 0.9617964421114027,
1308
+ "eval_precision-all": 0.9537876572097105,
1309
+ "eval_precision-das": 0.9620253164556962,
1310
+ "eval_precision-l1": 0.9531494013534617,
1311
+ "eval_precision-l2": 0.9546061415220294,
1312
+ "eval_recall": 0.9587209302325581,
1313
+ "eval_recall-all": 0.9574280681150911,
1314
+ "eval_recall-das": 0.9623836126629423,
1315
+ "eval_recall-l1": 0.9611548556430446,
1316
+ "eval_recall-l2": 0.9526982011992006,
1317
+ "eval_runtime": 5.7506,
1318
+ "eval_samples_per_second": 117.554,
1319
+ "eval_steps_per_second": 7.478,
1320
+ "step": 1300
1321
+ },
1322
+ {
1323
+ "epoch": 3.67,
1324
+ "eval_ACT": {
1325
+ "f1": 0.9439696106362773,
1326
+ "number": 519,
1327
+ "precision": 0.9307116104868914,
1328
+ "recall": 0.9576107899807321
1329
+ },
1330
+ "eval_ACT_L1": {
1331
+ "f1": 0.9616519174041297,
1332
+ "number": 503,
1333
+ "precision": 0.9513618677042801,
1334
+ "recall": 0.9721669980119284
1335
+ },
1336
+ "eval_ACT_L2": {
1337
+ "f1": 0.4444444444444445,
1338
+ "number": 16,
1339
+ "precision": 0.4,
1340
+ "recall": 0.5
1341
+ },
1342
+ "eval_CARDINAL": {
1343
+ "f1": 0.9830757910228108,
1344
+ "number": 678,
1345
+ "precision": 0.9809104258443465,
1346
+ "recall": 0.9852507374631269
1347
+ },
1348
+ "eval_DESC": {
1349
+ "f1": 0.4927536231884058,
1350
+ "number": 30,
1351
+ "precision": 0.4358974358974359,
1352
+ "recall": 0.5666666666666667
1353
+ },
1354
+ "eval_FT": {
1355
+ "f1": 0.22222222222222224,
1356
+ "number": 7,
1357
+ "precision": 0.5,
1358
+ "recall": 0.14285714285714285
1359
+ },
1360
+ "eval_LOC": {
1361
+ "f1": 0.9560655737704917,
1362
+ "number": 761,
1363
+ "precision": 0.9541884816753927,
1364
+ "recall": 0.9579500657030223
1365
+ },
1366
+ "eval_PER": {
1367
+ "f1": 0.9807692307692307,
1368
+ "number": 676,
1369
+ "precision": 0.9807692307692307,
1370
+ "recall": 0.9807692307692307
1371
+ },
1372
+ "eval_SPAT": {
1373
+ "f1": 0.9590222861250898,
1374
+ "number": 694,
1375
+ "precision": 0.9569583931133429,
1376
+ "recall": 0.9610951008645533
1377
+ },
1378
+ "eval_TITRE": {
1379
+ "f1": 0.0,
1380
+ "number": 2,
1381
+ "precision": 0.0,
1382
+ "recall": 0.0
1383
+ },
1384
+ "eval_TITREH": {
1385
+ "f1": 0.875,
1386
+ "number": 33,
1387
+ "precision": 0.9032258064516129,
1388
+ "recall": 0.8484848484848485
1389
+ },
1390
+ "eval_TITREP": {
1391
+ "f1": 0.3333333333333333,
1392
+ "number": 6,
1393
+ "precision": 0.3333333333333333,
1394
+ "recall": 0.3333333333333333
1395
+ },
1396
+ "eval_accuracy": 0.9583649708934447,
1397
+ "eval_accuracy-all": 0.9695646671728676,
1398
+ "eval_accuracy-das": 0.9716527461402177,
1399
+ "eval_accuracy-l1": 0.9645659326752721,
1400
+ "eval_accuracy-l2": 0.9745634016704632,
1401
+ "eval_f1": 0.9603128621089224,
1402
+ "eval_f1-all": 0.957284961966062,
1403
+ "eval_f1-das": 0.9644783336432956,
1404
+ "eval_f1-l1": 0.9584964761158966,
1405
+ "eval_f1-l2": 0.9557404326123128,
1406
+ "eval_loss": 0.17416799068450928,
1407
+ "eval_precision": 0.956986143187067,
1408
+ "eval_precision-all": 0.953935860058309,
1409
+ "eval_precision-das": 0.9632243684992571,
1410
+ "eval_precision-l1": 0.9532710280373832,
1411
+ "eval_precision-l2": 0.9547872340425532,
1412
+ "eval_recall": 0.9636627906976745,
1413
+ "eval_recall-all": 0.9606576629477392,
1414
+ "eval_recall-das": 0.9657355679702049,
1415
+ "eval_recall-l1": 0.9637795275590552,
1416
+ "eval_recall-l2": 0.9566955363091273,
1417
+ "eval_runtime": 6.3107,
1418
+ "eval_samples_per_second": 107.119,
1419
+ "eval_steps_per_second": 6.814,
1420
+ "step": 1400
1421
+ },
1422
+ {
1423
+ "epoch": 3.94,
1424
+ "learning_rate": 7e-05,
1425
+ "loss": 0.0854,
1426
+ "step": 1500
1427
+ },
1428
+ {
1429
+ "epoch": 3.94,
1430
+ "eval_ACT": {
1431
+ "f1": 0.9382716049382717,
1432
+ "number": 519,
1433
+ "precision": 0.9250936329588015,
1434
+ "recall": 0.9518304431599229
1435
+ },
1436
+ "eval_ACT_L1": {
1437
+ "f1": 0.9614243323442137,
1438
+ "number": 503,
1439
+ "precision": 0.9566929133858267,
1440
+ "recall": 0.9662027833001988
1441
+ },
1442
+ "eval_ACT_L2": {
1443
+ "f1": 0.380952380952381,
1444
+ "number": 16,
1445
+ "precision": 0.3076923076923077,
1446
+ "recall": 0.5
1447
+ },
1448
+ "eval_CARDINAL": {
1449
+ "f1": 0.9874538745387453,
1450
+ "number": 678,
1451
+ "precision": 0.9881831610044313,
1452
+ "recall": 0.9867256637168141
1453
+ },
1454
+ "eval_DESC": {
1455
+ "f1": 0.5142857142857143,
1456
+ "number": 30,
1457
+ "precision": 0.45,
1458
+ "recall": 0.6
1459
+ },
1460
+ "eval_FT": {
1461
+ "f1": 0.2,
1462
+ "number": 7,
1463
+ "precision": 0.3333333333333333,
1464
+ "recall": 0.14285714285714285
1465
+ },
1466
+ "eval_LOC": {
1467
+ "f1": 0.9559500328731098,
1468
+ "number": 761,
1469
+ "precision": 0.9565789473684211,
1470
+ "recall": 0.9553219448094612
1471
+ },
1472
+ "eval_PER": {
1473
+ "f1": 0.9763313609467456,
1474
+ "number": 676,
1475
+ "precision": 0.9763313609467456,
1476
+ "recall": 0.9763313609467456
1477
+ },
1478
+ "eval_SPAT": {
1479
+ "f1": 0.9577060931899642,
1480
+ "number": 694,
1481
+ "precision": 0.9529243937232525,
1482
+ "recall": 0.962536023054755
1483
+ },
1484
+ "eval_TITRE": {
1485
+ "f1": 0.0,
1486
+ "number": 2,
1487
+ "precision": 0.0,
1488
+ "recall": 0.0
1489
+ },
1490
+ "eval_TITREH": {
1491
+ "f1": 0.8529411764705883,
1492
+ "number": 33,
1493
+ "precision": 0.8285714285714286,
1494
+ "recall": 0.8787878787878788
1495
+ },
1496
+ "eval_TITREP": {
1497
+ "f1": 0.5454545454545454,
1498
+ "number": 6,
1499
+ "precision": 0.6,
1500
+ "recall": 0.5
1501
+ },
1502
+ "eval_accuracy": 0.9515312579093901,
1503
+ "eval_accuracy-all": 0.9630473297899266,
1504
+ "eval_accuracy-das": 0.9717792963806631,
1505
+ "eval_accuracy-l1": 0.9570994684889901,
1506
+ "eval_accuracy-l2": 0.9689951910908631,
1507
+ "eval_f1": 0.9592576482528636,
1508
+ "eval_f1-all": 0.9562673687289747,
1509
+ "eval_f1-das": 0.9624395686128672,
1510
+ "eval_f1-l1": 0.9566579634464752,
1511
+ "eval_f1-l2": 0.9557698703026272,
1512
+ "eval_loss": 0.18355852365493774,
1513
+ "eval_precision": 0.9568990454150998,
1514
+ "eval_precision-all": 0.9527834450597493,
1515
+ "eval_precision-das": 0.961010025993316,
1516
+ "eval_precision-l1": 0.9516883116883117,
1517
+ "eval_precision-l2": 0.954183266932271,
1518
+ "eval_recall": 0.9616279069767442,
1519
+ "eval_recall-all": 0.959776864357017,
1520
+ "eval_recall-das": 0.9638733705772812,
1521
+ "eval_recall-l1": 0.9616797900262467,
1522
+ "eval_recall-l2": 0.9573617588274483,
1523
+ "eval_runtime": 6.1311,
1524
+ "eval_samples_per_second": 110.258,
1525
+ "eval_steps_per_second": 7.013,
1526
+ "step": 1500
1527
+ },
1528
+ {
1529
+ "epoch": 4.2,
1530
+ "eval_ACT": {
1531
+ "f1": 0.9375,
1532
+ "number": 519,
1533
+ "precision": 0.9217877094972067,
1534
+ "recall": 0.953757225433526
1535
+ },
1536
+ "eval_ACT_L1": {
1537
+ "f1": 0.9577187807276303,
1538
+ "number": 503,
1539
+ "precision": 0.9474708171206225,
1540
+ "recall": 0.9681908548707754
1541
+ },
1542
+ "eval_ACT_L2": {
1543
+ "f1": 0.41025641025641024,
1544
+ "number": 16,
1545
+ "precision": 0.34782608695652173,
1546
+ "recall": 0.5
1547
+ },
1548
+ "eval_CARDINAL": {
1549
+ "f1": 0.9874908020603386,
1550
+ "number": 678,
1551
+ "precision": 0.9853157121879589,
1552
+ "recall": 0.9896755162241888
1553
+ },
1554
+ "eval_DESC": {
1555
+ "f1": 0.5217391304347826,
1556
+ "number": 30,
1557
+ "precision": 0.46153846153846156,
1558
+ "recall": 0.6
1559
+ },
1560
+ "eval_FT": {
1561
+ "f1": 0.4615384615384615,
1562
+ "number": 7,
1563
+ "precision": 0.5,
1564
+ "recall": 0.42857142857142855
1565
+ },
1566
+ "eval_LOC": {
1567
+ "f1": 0.953063885267275,
1568
+ "number": 761,
1569
+ "precision": 0.9456662354463131,
1570
+ "recall": 0.9605781865965834
1571
+ },
1572
+ "eval_PER": {
1573
+ "f1": 0.9792899408284024,
1574
+ "number": 676,
1575
+ "precision": 0.9792899408284024,
1576
+ "recall": 0.9792899408284024
1577
+ },
1578
+ "eval_SPAT": {
1579
+ "f1": 0.9592566118656183,
1580
+ "number": 694,
1581
+ "precision": 0.9517730496453901,
1582
+ "recall": 0.9668587896253602
1583
+ },
1584
+ "eval_TITRE": {
1585
+ "f1": 0.5,
1586
+ "number": 2,
1587
+ "precision": 0.5,
1588
+ "recall": 0.5
1589
+ },
1590
+ "eval_TITREH": {
1591
+ "f1": 0.84375,
1592
+ "number": 33,
1593
+ "precision": 0.8709677419354839,
1594
+ "recall": 0.8181818181818182
1595
+ },
1596
+ "eval_TITREP": {
1597
+ "f1": 0.4,
1598
+ "number": 6,
1599
+ "precision": 0.3333333333333333,
1600
+ "recall": 0.5
1601
+ },
1602
+ "eval_accuracy": 0.9557074158440901,
1603
+ "eval_accuracy-all": 0.9666540116426221,
1604
+ "eval_accuracy-das": 0.9732978992660086,
1605
+ "eval_accuracy-l1": 0.9629207795494812,
1606
+ "eval_accuracy-l2": 0.9703872437357631,
1607
+ "eval_f1": 0.959525874530211,
1608
+ "eval_f1-all": 0.9561544064093226,
1609
+ "eval_f1-das": 0.9638286032276017,
1610
+ "eval_f1-l1": 0.9575631346003645,
1611
+ "eval_f1-l2": 0.9543650793650794,
1612
+ "eval_loss": 0.1747445911169052,
1613
+ "eval_precision": 0.9542840713053479,
1614
+ "eval_precision-all": 0.9488291413703382,
1615
+ "eval_precision-das": 0.9600886917960089,
1616
+ "eval_precision-l1": 0.949896694214876,
1617
+ "eval_precision-l2": 0.9474720945502298,
1618
+ "eval_recall": 0.9648255813953488,
1619
+ "eval_recall-all": 0.9635936582501468,
1620
+ "eval_recall-das": 0.9675977653631285,
1621
+ "eval_recall-l1": 0.9653543307086614,
1622
+ "eval_recall-l2": 0.9613590939373751,
1623
+ "eval_runtime": 6.3526,
1624
+ "eval_samples_per_second": 106.414,
1625
+ "eval_steps_per_second": 6.769,
1626
+ "step": 1600
1627
+ },
1628
+ {
1629
+ "epoch": 4.46,
1630
+ "eval_ACT": {
1631
+ "f1": 0.9438629876308278,
1632
+ "number": 519,
1633
+ "precision": 0.9323308270676691,
1634
+ "recall": 0.9556840077071291
1635
+ },
1636
+ "eval_ACT_L1": {
1637
+ "f1": 0.9663366336633663,
1638
+ "number": 503,
1639
+ "precision": 0.9625246548323472,
1640
+ "recall": 0.9701789264413518
1641
+ },
1642
+ "eval_ACT_L2": {
1643
+ "f1": 0.39024390243902435,
1644
+ "number": 16,
1645
+ "precision": 0.32,
1646
+ "recall": 0.5
1647
+ },
1648
+ "eval_CARDINAL": {
1649
+ "f1": 0.9867452135493373,
1650
+ "number": 678,
1651
+ "precision": 0.9852941176470589,
1652
+ "recall": 0.9882005899705014
1653
+ },
1654
+ "eval_DESC": {
1655
+ "f1": 0.5373134328358209,
1656
+ "number": 30,
1657
+ "precision": 0.4864864864864865,
1658
+ "recall": 0.6
1659
+ },
1660
+ "eval_FT": {
1661
+ "f1": 0.0,
1662
+ "number": 7,
1663
+ "precision": 0.0,
1664
+ "recall": 0.0
1665
+ },
1666
+ "eval_LOC": {
1667
+ "f1": 0.9619921363040629,
1668
+ "number": 761,
1669
+ "precision": 0.9594771241830066,
1670
+ "recall": 0.9645203679369251
1671
+ },
1672
+ "eval_PER": {
1673
+ "f1": 0.9792899408284024,
1674
+ "number": 676,
1675
+ "precision": 0.9792899408284024,
1676
+ "recall": 0.9792899408284024
1677
+ },
1678
+ "eval_SPAT": {
1679
+ "f1": 0.9627507163323783,
1680
+ "number": 694,
1681
+ "precision": 0.9572649572649573,
1682
+ "recall": 0.968299711815562
1683
+ },
1684
+ "eval_TITRE": {
1685
+ "f1": 0.0,
1686
+ "number": 2,
1687
+ "precision": 0.0,
1688
+ "recall": 0.0
1689
+ },
1690
+ "eval_TITREH": {
1691
+ "f1": 0.8484848484848486,
1692
+ "number": 33,
1693
+ "precision": 0.8484848484848485,
1694
+ "recall": 0.8484848484848485
1695
+ },
1696
+ "eval_TITREP": {
1697
+ "f1": 0.5454545454545454,
1698
+ "number": 6,
1699
+ "precision": 0.6,
1700
+ "recall": 0.5
1701
+ },
1702
+ "eval_accuracy": 0.9554543153631991,
1703
+ "eval_accuracy-all": 0.9662743609212857,
1704
+ "eval_accuracy-das": 0.975069602632245,
1705
+ "eval_accuracy-l1": 0.9619083776259175,
1706
+ "eval_accuracy-l2": 0.970640344216654,
1707
+ "eval_f1": 0.9615552009284782,
1708
+ "eval_f1-all": 0.9603627321924821,
1709
+ "eval_f1-das": 0.9665178571428571,
1710
+ "eval_f1-l1": 0.9615887117846877,
1711
+ "eval_f1-l2": 0.9588039867109635,
1712
+ "eval_loss": 0.17034310102462769,
1713
+ "eval_precision": 0.9597451491456704,
1714
+ "eval_precision-all": 0.9568638880792771,
1715
+ "eval_precision-das": 0.9654403567447045,
1716
+ "eval_precision-l1": 0.9573361082206036,
1717
+ "eval_precision-l2": 0.9562624254473161,
1718
+ "eval_recall": 0.9633720930232558,
1719
+ "eval_recall-all": 0.9638872577803875,
1720
+ "eval_recall-das": 0.9675977653631285,
1721
+ "eval_recall-l1": 0.9658792650918635,
1722
+ "eval_recall-l2": 0.9613590939373751,
1723
+ "eval_runtime": 6.4585,
1724
+ "eval_samples_per_second": 104.669,
1725
+ "eval_steps_per_second": 6.658,
1726
+ "step": 1700
1727
+ },
1728
+ {
1729
+ "epoch": 4.72,
1730
+ "eval_ACT": {
1731
+ "f1": 0.9551098376313275,
1732
+ "number": 519,
1733
+ "precision": 0.946969696969697,
1734
+ "recall": 0.9633911368015414
1735
+ },
1736
+ "eval_ACT_L1": {
1737
+ "f1": 0.971540726202159,
1738
+ "number": 503,
1739
+ "precision": 0.9593023255813954,
1740
+ "recall": 0.9840954274353877
1741
+ },
1742
+ "eval_ACT_L2": {
1743
+ "f1": 0.35714285714285715,
1744
+ "number": 16,
1745
+ "precision": 0.4166666666666667,
1746
+ "recall": 0.3125
1747
+ },
1748
+ "eval_CARDINAL": {
1749
+ "f1": 0.9867452135493373,
1750
+ "number": 678,
1751
+ "precision": 0.9852941176470589,
1752
+ "recall": 0.9882005899705014
1753
+ },
1754
+ "eval_DESC": {
1755
+ "f1": 0.523076923076923,
1756
+ "number": 30,
1757
+ "precision": 0.4857142857142857,
1758
+ "recall": 0.5666666666666667
1759
+ },
1760
+ "eval_FT": {
1761
+ "f1": 0.42857142857142855,
1762
+ "number": 7,
1763
+ "precision": 0.42857142857142855,
1764
+ "recall": 0.42857142857142855
1765
+ },
1766
+ "eval_LOC": {
1767
+ "f1": 0.945645055664702,
1768
+ "number": 761,
1769
+ "precision": 0.9425587467362925,
1770
+ "recall": 0.9487516425755584
1771
+ },
1772
+ "eval_PER": {
1773
+ "f1": 0.9800148038490007,
1774
+ "number": 676,
1775
+ "precision": 0.9807407407407407,
1776
+ "recall": 0.9792899408284024
1777
+ },
1778
+ "eval_SPAT": {
1779
+ "f1": 0.9463902787705505,
1780
+ "number": 694,
1781
+ "precision": 0.9390070921985816,
1782
+ "recall": 0.9538904899135446
1783
+ },
1784
+ "eval_TITRE": {
1785
+ "f1": 0.0,
1786
+ "number": 2,
1787
+ "precision": 0.0,
1788
+ "recall": 0.0
1789
+ },
1790
+ "eval_TITREH": {
1791
+ "f1": 0.875,
1792
+ "number": 33,
1793
+ "precision": 0.9032258064516129,
1794
+ "recall": 0.8484848484848485
1795
+ },
1796
+ "eval_TITREP": {
1797
+ "f1": 0.30769230769230765,
1798
+ "number": 6,
1799
+ "precision": 0.2857142857142857,
1800
+ "recall": 0.3333333333333333
1801
+ },
1802
+ "eval_accuracy": 0.9596304732978993,
1803
+ "eval_accuracy-all": 0.968299164768413,
1804
+ "eval_accuracy-das": 0.9749430523917996,
1805
+ "eval_accuracy-l1": 0.9654517843583903,
1806
+ "eval_accuracy-l2": 0.9711465451784358,
1807
+ "eval_f1": 0.9605339524085896,
1808
+ "eval_f1-all": 0.9548311650343518,
1809
+ "eval_f1-das": 0.9643255295429208,
1810
+ "eval_f1-l1": 0.9569976544175137,
1811
+ "eval_f1-l2": 0.9520639147802931,
1812
+ "eval_loss": 0.17404037714004517,
1813
+ "eval_precision": 0.958864426419467,
1814
+ "eval_precision-all": 0.9508005822416302,
1815
+ "eval_precision-das": 0.9621802002224694,
1816
+ "eval_precision-l1": 0.9503105590062112,
1817
+ "eval_precision-l2": 0.9514304723885563,
1818
+ "eval_recall": 0.9622093023255814,
1819
+ "eval_recall-all": 0.9588960657662948,
1820
+ "eval_recall-das": 0.9664804469273743,
1821
+ "eval_recall-l1": 0.9637795275590552,
1822
+ "eval_recall-l2": 0.9526982011992006,
1823
+ "eval_runtime": 5.4184,
1824
+ "eval_samples_per_second": 124.761,
1825
+ "eval_steps_per_second": 7.936,
1826
+ "step": 1800
1827
+ },
1828
+ {
1829
+ "epoch": 4.99,
1830
+ "eval_ACT": {
1831
+ "f1": 0.939047619047619,
1832
+ "number": 519,
1833
+ "precision": 0.928436911487759,
1834
+ "recall": 0.9499036608863198
1835
+ },
1836
+ "eval_ACT_L1": {
1837
+ "f1": 0.961576354679803,
1838
+ "number": 503,
1839
+ "precision": 0.953125,
1840
+ "recall": 0.9701789264413518
1841
+ },
1842
+ "eval_ACT_L2": {
1843
+ "f1": 0.2857142857142857,
1844
+ "number": 16,
1845
+ "precision": 0.2631578947368421,
1846
+ "recall": 0.3125
1847
+ },
1848
+ "eval_CARDINAL": {
1849
+ "f1": 0.9815770081061163,
1850
+ "number": 678,
1851
+ "precision": 0.9808541973490427,
1852
+ "recall": 0.9823008849557522
1853
+ },
1854
+ "eval_DESC": {
1855
+ "f1": 0.5483870967741935,
1856
+ "number": 30,
1857
+ "precision": 0.53125,
1858
+ "recall": 0.5666666666666667
1859
+ },
1860
+ "eval_FT": {
1861
+ "f1": 0.2,
1862
+ "number": 7,
1863
+ "precision": 0.3333333333333333,
1864
+ "recall": 0.14285714285714285
1865
+ },
1866
+ "eval_LOC": {
1867
+ "f1": 0.953063885267275,
1868
+ "number": 761,
1869
+ "precision": 0.9456662354463131,
1870
+ "recall": 0.9605781865965834
1871
+ },
1872
+ "eval_PER": {
1873
+ "f1": 0.977810650887574,
1874
+ "number": 676,
1875
+ "precision": 0.977810650887574,
1876
+ "recall": 0.977810650887574
1877
+ },
1878
+ "eval_SPAT": {
1879
+ "f1": 0.9626972740315638,
1880
+ "number": 694,
1881
+ "precision": 0.9585714285714285,
1882
+ "recall": 0.9668587896253602
1883
+ },
1884
+ "eval_TITRE": {
1885
+ "f1": 0.0,
1886
+ "number": 2,
1887
+ "precision": 0.0,
1888
+ "recall": 0.0
1889
+ },
1890
+ "eval_TITREH": {
1891
+ "f1": 0.8285714285714285,
1892
+ "number": 33,
1893
+ "precision": 0.7837837837837838,
1894
+ "recall": 0.8787878787878788
1895
+ },
1896
+ "eval_TITREP": {
1897
+ "f1": 0.28571428571428575,
1898
+ "number": 6,
1899
+ "precision": 0.25,
1900
+ "recall": 0.3333333333333333
1901
+ },
1902
+ "eval_accuracy": 0.9579853201721084,
1903
+ "eval_accuracy-all": 0.9677929638066313,
1904
+ "eval_accuracy-das": 0.9754492533535813,
1905
+ "eval_accuracy-l1": 0.9646924829157175,
1906
+ "eval_accuracy-l2": 0.9708934446975449,
1907
+ "eval_f1": 0.9568491167101071,
1908
+ "eval_f1-all": 0.9554549437709947,
1909
+ "eval_f1-das": 0.9595997034840623,
1910
+ "eval_f1-l1": 0.96002090410243,
1911
+ "eval_f1-l2": 0.9496688741721854,
1912
+ "eval_loss": 0.18735294044017792,
1913
+ "eval_precision": 0.953260242354299,
1914
+ "eval_precision-all": 0.95059575704737,
1915
+ "eval_precision-das": 0.9549981556621173,
1916
+ "eval_precision-l1": 0.9557752341311134,
1917
+ "eval_precision-l2": 0.9440421329822252,
1918
+ "eval_recall": 0.9604651162790697,
1919
+ "eval_recall-all": 0.9603640634174986,
1920
+ "eval_recall-das": 0.964245810055866,
1921
+ "eval_recall-l1": 0.9643044619422572,
1922
+ "eval_recall-l2": 0.955363091272485,
1923
+ "eval_runtime": 5.4368,
1924
+ "eval_samples_per_second": 124.338,
1925
+ "eval_steps_per_second": 7.909,
1926
+ "step": 1900
1927
+ },
1928
+ {
1929
+ "epoch": 5.25,
1930
+ "learning_rate": 6e-05,
1931
+ "loss": 0.0555,
1932
+ "step": 2000
1933
+ },
1934
+ {
1935
+ "epoch": 5.25,
1936
+ "eval_ACT": {
1937
+ "f1": 0.9514747859181732,
1938
+ "number": 519,
1939
+ "precision": 0.9398496240601504,
1940
+ "recall": 0.9633911368015414
1941
+ },
1942
+ "eval_ACT_L1": {
1943
+ "f1": 0.970414201183432,
1944
+ "number": 503,
1945
+ "precision": 0.9628180039138943,
1946
+ "recall": 0.9781312127236581
1947
+ },
1948
+ "eval_ACT_L2": {
1949
+ "f1": 0.4324324324324324,
1950
+ "number": 16,
1951
+ "precision": 0.38095238095238093,
1952
+ "recall": 0.5
1953
+ },
1954
+ "eval_CARDINAL": {
1955
+ "f1": 0.9874723655121592,
1956
+ "number": 678,
1957
+ "precision": 0.9867452135493373,
1958
+ "recall": 0.9882005899705014
1959
+ },
1960
+ "eval_DESC": {
1961
+ "f1": 0.5538461538461538,
1962
+ "number": 30,
1963
+ "precision": 0.5142857142857142,
1964
+ "recall": 0.6
1965
+ },
1966
+ "eval_FT": {
1967
+ "f1": 0.30769230769230765,
1968
+ "number": 7,
1969
+ "precision": 0.3333333333333333,
1970
+ "recall": 0.2857142857142857
1971
+ },
1972
+ "eval_LOC": {
1973
+ "f1": 0.9625246548323472,
1974
+ "number": 761,
1975
+ "precision": 0.9631578947368421,
1976
+ "recall": 0.961892247043364
1977
+ },
1978
+ "eval_PER": {
1979
+ "f1": 0.9800148038490007,
1980
+ "number": 676,
1981
+ "precision": 0.9807407407407407,
1982
+ "recall": 0.9792899408284024
1983
+ },
1984
+ "eval_SPAT": {
1985
+ "f1": 0.9612625538020085,
1986
+ "number": 694,
1987
+ "precision": 0.9571428571428572,
1988
+ "recall": 0.9654178674351584
1989
+ },
1990
+ "eval_TITRE": {
1991
+ "f1": 0.0,
1992
+ "number": 2,
1993
+ "precision": 0.0,
1994
+ "recall": 0.0
1995
+ },
1996
+ "eval_TITREH": {
1997
+ "f1": 0.8923076923076922,
1998
+ "number": 33,
1999
+ "precision": 0.90625,
2000
+ "recall": 0.8787878787878788
2001
+ },
2002
+ "eval_TITREP": {
2003
+ "f1": 0.5,
2004
+ "number": 6,
2005
+ "precision": 0.5,
2006
+ "recall": 0.5
2007
+ },
2008
+ "eval_accuracy": 0.958744621614781,
2009
+ "eval_accuracy-all": 0.9686155403695267,
2010
+ "eval_accuracy-das": 0.9762085547962541,
2011
+ "eval_accuracy-l1": 0.9640597317134902,
2012
+ "eval_accuracy-l2": 0.9731713490255631,
2013
+ "eval_f1": 0.9654571843251089,
2014
+ "eval_f1-all": 0.9620846142585272,
2015
+ "eval_f1-das": 0.9683897359613239,
2016
+ "eval_f1-l1": 0.9628855201254575,
2017
+ "eval_f1-l2": 0.9610648918469219,
2018
+ "eval_loss": 0.18852506577968597,
2019
+ "eval_precision": 0.9640579710144928,
2020
+ "eval_precision-all": 0.9594160583941606,
2021
+ "eval_precision-das": 0.966951355365763,
2022
+ "eval_precision-l1": 0.9588755856324831,
2023
+ "eval_precision-l2": 0.9601063829787234,
2024
+ "eval_recall": 0.9668604651162791,
2025
+ "eval_recall-all": 0.9647680563711099,
2026
+ "eval_recall-das": 0.9698324022346368,
2027
+ "eval_recall-l1": 0.9669291338582677,
2028
+ "eval_recall-l2": 0.9620253164556962,
2029
+ "eval_runtime": 5.6224,
2030
+ "eval_samples_per_second": 120.232,
2031
+ "eval_steps_per_second": 7.648,
2032
+ "step": 2000
2033
+ }
2034
+ ],
2035
+ "max_steps": 5000,
2036
+ "num_train_epochs": 14,
2037
+ "total_flos": 813927239246016.0,
2038
+ "trial_name": null,
2039
+ "trial_params": null
2040
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fafe089429a55c7d806db2eb03e3c43b298ca050f16f8611d2b68740fabcbe5d
3
+ size 3503