asahi417 commited on
Commit
9bb2646
1 Parent(s): 41c9d81
config.json ADDED
@@ -0,0 +1,138 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "xlm-roberta-base",
3
+ "architectures": [
4
+ "XLMRobertaForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "B-organization",
15
+ "1": "O",
16
+ "2": "B-other",
17
+ "3": "B-person",
18
+ "4": "I-person",
19
+ "5": "B-location",
20
+ "6": "I-organization",
21
+ "7": "I-other",
22
+ "8": "I-location",
23
+ "9": "B-cardinal number",
24
+ "10": "B-date",
25
+ "11": "I-date",
26
+ "12": "B-group",
27
+ "13": "B-geopolitical area",
28
+ "14": "I-geopolitical area",
29
+ "15": "B-law",
30
+ "16": "I-law",
31
+ "17": "B-percent",
32
+ "18": "I-percent",
33
+ "19": "B-ordinal number",
34
+ "20": "B-money",
35
+ "21": "I-money",
36
+ "22": "B-work of art",
37
+ "23": "I-work of art",
38
+ "24": "B-facility",
39
+ "25": "B-time",
40
+ "26": "I-cardinal number",
41
+ "27": "B-quantity",
42
+ "28": "I-quantity",
43
+ "29": "I-group",
44
+ "30": "B-product",
45
+ "31": "I-time",
46
+ "32": "B-event",
47
+ "33": "I-event",
48
+ "34": "I-facility",
49
+ "35": "B-language",
50
+ "36": "I-product",
51
+ "37": "I-ordinal number",
52
+ "38": "I-language",
53
+ "39": "B-chemical",
54
+ "40": "B-disease",
55
+ "41": "I-disease",
56
+ "42": "I-chemical",
57
+ "43": "B-dna",
58
+ "44": "I-dna",
59
+ "45": "B-protein",
60
+ "46": "I-protein",
61
+ "47": "B-cell type",
62
+ "48": "I-cell type",
63
+ "49": "B-cell line",
64
+ "50": "I-cell line",
65
+ "51": "B-rna",
66
+ "52": "I-rna",
67
+ "53": "B-corporation",
68
+ "54": "I-corporation"
69
+ },
70
+ "initializer_range": 0.02,
71
+ "intermediate_size": 3072,
72
+ "label2id": {
73
+ "B-cardinal number": 9,
74
+ "B-cell line": 49,
75
+ "B-cell type": 47,
76
+ "B-chemical": 39,
77
+ "B-corporation": 53,
78
+ "B-date": 10,
79
+ "B-disease": 40,
80
+ "B-dna": 43,
81
+ "B-event": 32,
82
+ "B-facility": 24,
83
+ "B-geopolitical area": 13,
84
+ "B-group": 12,
85
+ "B-language": 35,
86
+ "B-law": 15,
87
+ "B-location": 5,
88
+ "B-money": 20,
89
+ "B-ordinal number": 19,
90
+ "B-organization": 0,
91
+ "B-other": 2,
92
+ "B-percent": 17,
93
+ "B-person": 3,
94
+ "B-product": 30,
95
+ "B-protein": 45,
96
+ "B-quantity": 27,
97
+ "B-rna": 51,
98
+ "B-time": 25,
99
+ "B-work of art": 22,
100
+ "I-cardinal number": 26,
101
+ "I-cell line": 50,
102
+ "I-cell type": 48,
103
+ "I-chemical": 42,
104
+ "I-corporation": 54,
105
+ "I-date": 11,
106
+ "I-disease": 41,
107
+ "I-dna": 44,
108
+ "I-event": 33,
109
+ "I-facility": 34,
110
+ "I-geopolitical area": 14,
111
+ "I-group": 29,
112
+ "I-language": 38,
113
+ "I-law": 16,
114
+ "I-location": 8,
115
+ "I-money": 21,
116
+ "I-ordinal number": 37,
117
+ "I-organization": 6,
118
+ "I-other": 7,
119
+ "I-percent": 18,
120
+ "I-person": 4,
121
+ "I-product": 36,
122
+ "I-protein": 46,
123
+ "I-quantity": 28,
124
+ "I-rna": 52,
125
+ "I-time": 31,
126
+ "I-work of art": 23,
127
+ "O": 1
128
+ },
129
+ "layer_norm_eps": 1e-05,
130
+ "max_position_embeddings": 514,
131
+ "model_type": "xlm-roberta",
132
+ "num_attention_heads": 12,
133
+ "num_hidden_layers": 12,
134
+ "output_past": true,
135
+ "pad_token_id": 1,
136
+ "type_vocab_size": 1,
137
+ "vocab_size": 250002
138
+ }
events.out.tfevents.1609932275.comsc-ISRMOT-220.1171340.0 ADDED
Binary file (1.6 MB). View file
 
parameter.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dataset": ["conll2003", "ontonotes5", "bc5cdr", "bionlp2004", "fin", "wnut2017", "panx_dataset/en"], "transformers_model": "xlm-roberta-base", "random_seed": 1234, "lr": 1e-05, "total_step": 15000, "warmup_step": 700, "weight_decay": 1e-07, "batch_size": 32, "max_seq_length": 128, "fp16": false, "max_grad_norm": 1.0, "lower_case": false}
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ff2ff283222fd7933343608b058c5e0ee3cf53294927f54dd250d87db775e0d
3
+ size 1110067033
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": "<mask>"}
test_bc5cdr.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 80.23514458214171, "recall": 79.3359865940511, "precision": 81.15491750589243, "summary": " precision recall f1-score support\n\n chemical 0.88 0.83 0.85 5324\n disease 0.73 0.75 0.74 4224\n\n micro avg 0.81 0.79 0.80 9548\n macro avg 0.81 0.79 0.80 9548\nweighted avg 0.81 0.79 0.80 9548\n"}, "test": {"f1": 79.43848902501277, "recall": 79.47906026557712, "precision": 79.39795918367348, "summary": " precision recall f1-score support\n\n chemical 0.85 0.83 0.84 5374\n disease 0.73 0.75 0.74 4416\n\n micro avg 0.79 0.79 0.79 9790\n macro avg 0.79 0.79 0.79 9790\nweighted avg 0.80 0.79 0.80 9790\n"}}
test_bc5cdr_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 80.87837479446243, "recall": 79.84918307498953, "precision": 81.93444384739388, "summary": " precision recall f1-score support\n\n entity 0.82 0.80 0.81 9548\n\n micro avg 0.82 0.80 0.81 9548\n macro avg 0.82 0.80 0.81 9548\nweighted avg 0.82 0.80 0.81 9548\n"}, "test": {"f1": 80.02044467160746, "recall": 79.9591419816139, "precision": 80.08184143222506, "summary": " precision recall f1-score support\n\n entity 0.80 0.80 0.80 9790\n\n micro avg 0.80 0.80 0.80 9790\n macro avg 0.80 0.80 0.80 9790\nweighted avg 0.80 0.80 0.80 9790\n"}}
test_bionlp2004.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 72.85890491768113, "recall": 78.59539511743607, "precision": 67.90283886445422, "summary": " precision recall f1-score support\n\n cell line 0.50 0.66 0.57 500\n cell type 0.75 0.73 0.74 1919\n dna 0.65 0.76 0.70 1054\n protein 0.69 0.83 0.75 5052\n rna 0.60 0.78 0.68 118\n\n micro avg 0.68 0.79 0.73 8643\n macro avg 0.64 0.75 0.69 8643\nweighted avg 0.68 0.79 0.73 8643\n"}}
test_bionlp2004_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 78.14962755046962, "recall": 83.75564040263798, "precision": 73.24698978043104, "summary": " precision recall f1-score support\n\n entity 0.73 0.84 0.78 8643\n\n micro avg 0.73 0.84 0.78 8643\n macro avg 0.73 0.84 0.78 8643\nweighted avg 0.73 0.84 0.78 8643\n"}}
test_conll2003.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 89.10754358708786, "recall": 87.12236286919831, "precision": 91.18530295000883, "summary": " precision recall f1-score support\n\n location 0.94 0.84 0.89 1837\norganization 0.84 0.90 0.87 1341\n other 0.86 0.71 0.78 922\n person 0.96 0.96 0.96 1825\n\n micro avg 0.91 0.87 0.89 5925\n macro avg 0.90 0.85 0.87 5925\nweighted avg 0.91 0.87 0.89 5925\n"}, "test": {"f1": 87.15473317243229, "recall": 86.54358246050063, "precision": 87.77457688152683, "summary": " precision recall f1-score support\n\n location 0.91 0.83 0.87 1660\norganization 0.83 0.89 0.86 1661\n other 0.75 0.70 0.72 702\n person 0.95 0.95 0.95 1610\n\n micro avg 0.88 0.87 0.87 5633\n macro avg 0.86 0.84 0.85 5633\nweighted avg 0.88 0.87 0.87 5633\n"}}
test_conll2003_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 93.0795847750865, "recall": 90.80168776371308, "precision": 95.47471162377995, "summary": " precision recall f1-score support\n\n entity 0.95 0.91 0.93 5925\n\n micro avg 0.95 0.91 0.93 5925\n macro avg 0.95 0.91 0.93 5925\nweighted avg 0.95 0.91 0.93 5925\n"}, "test": {"f1": 92.37113402061856, "recall": 91.4610331972306, "precision": 93.29952915610285, "summary": " precision recall f1-score support\n\n entity 0.93 0.91 0.92 5633\n\n micro avg 0.93 0.91 0.92 5633\n macro avg 0.93 0.91 0.92 5633\nweighted avg 0.93 0.91 0.92 5633\n"}}
test_fin.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 72.38095238095238, "recall": 73.64341085271317, "precision": 71.16104868913857, "summary": " precision recall f1-score support\n\n location 0.38 0.37 0.38 35\norganization 0.38 0.48 0.42 50\n other 1.00 0.33 0.50 6\n person 0.90 0.90 0.90 167\n\n micro avg 0.71 0.74 0.72 258\n macro avg 0.67 0.52 0.55 258\nweighted avg 0.73 0.74 0.73 258\n"}}
test_fin_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 74.80916030534351, "recall": 75.96899224806202, "precision": 73.68421052631578, "summary": " precision recall f1-score support\n\n entity 0.74 0.76 0.75 258\n\n micro avg 0.74 0.76 0.75 258\n macro avg 0.74 0.76 0.75 258\nweighted avg 0.74 0.76 0.75 258\n"}}
test_ontonotes5.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 84.13521731353961, "recall": 85.2096730368626, "precision": 83.08752097500663, "summary": " precision recall f1-score support\n\n cardinal number 0.82 0.82 0.82 937\n date 0.80 0.83 0.82 1507\n event 0.65 0.57 0.60 143\n facility 0.48 0.57 0.52 115\ngeopolitical area 0.93 0.90 0.91 2262\n group 0.89 0.87 0.88 847\n language 0.64 0.76 0.69 33\n law 0.47 0.47 0.48 40\n location 0.44 0.68 0.54 204\n money 0.87 0.89 0.88 274\n ordinal number 0.84 0.81 0.82 232\n organization 0.81 0.84 0.83 1728\n percent 0.90 0.90 0.90 177\n person 0.90 0.94 0.92 2014\n product 0.60 0.64 0.62 72\n quantity 0.73 0.76 0.75 100\n time 0.68 0.76 0.72 214\n work of art 0.40 0.46 0.43 142\n\n micro avg 0.83 0.85 0.84 11041\n macro avg 0.71 0.75 0.73 11041\n weighted avg 0.84 0.85 0.84 11041\n"}, "test": {"f1": 85.83381038354837, "recall": 86.62341125233313, "precision": 85.05847442834701, "summary": " precision recall f1-score support\n\n cardinal number 0.83 0.82 0.83 934\n date 0.81 0.85 0.83 1601\n event 0.56 0.56 0.56 63\n facility 0.69 0.67 0.68 135\ngeopolitical area 0.95 0.92 0.94 2240\n group 0.86 0.86 0.86 841\n language 0.71 0.45 0.56 22\n law 0.65 0.50 0.56 40\n location 0.49 0.73 0.59 179\n money 0.87 0.89 0.88 314\n ordinal number 0.82 0.92 0.87 195\n organization 0.83 0.87 0.85 1792\n percent 0.87 0.87 0.87 348\n person 0.93 0.94 0.93 1988\n product 0.61 0.57 0.59 76\n quantity 0.74 0.76 0.75 105\n time 0.60 0.66 0.63 212\n work of art 0.52 0.51 0.52 166\n\n micro avg 0.85 0.87 0.86 11251\n macro avg 0.74 0.74 0.74 11251\n weighted avg 0.85 0.87 0.86 11251\n"}}
test_ontonotes5_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 89.20559277075935, "recall": 89.8559913051354, "precision": 88.5645420460632, "summary": " precision recall f1-score support\n\n entity 0.89 0.90 0.89 11041\n\n micro avg 0.89 0.90 0.89 11041\n macro avg 0.89 0.90 0.89 11041\nweighted avg 0.89 0.90 0.89 11041\n"}, "test": {"f1": 89.70731275974887, "recall": 90.1697626877611, "precision": 89.24958212369138, "summary": " precision recall f1-score support\n\n entity 0.89 0.90 0.90 11251\n\n micro avg 0.89 0.90 0.90 11251\n macro avg 0.89 0.90 0.90 11251\nweighted avg 0.89 0.90 0.90 11251\n"}}
test_panx_dataset-en.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 79.24275541140801, "recall": 79.62451292950762, "precision": 78.8646410778191, "summary": " precision recall f1-score support\n\n location 0.80 0.81 0.80 4803\norganization 0.71 0.69 0.70 4677\n person 0.86 0.89 0.87 4635\n\n micro avg 0.79 0.80 0.79 14115\n macro avg 0.79 0.80 0.79 14115\nweighted avg 0.79 0.80 0.79 14115\n"}, "test": {"f1": 79.12734579640461, "recall": 79.35799625737728, "precision": 78.89803220035778, "summary": " precision recall f1-score support\n\n location 0.79 0.80 0.80 4633\norganization 0.72 0.69 0.70 4744\n person 0.85 0.90 0.87 4517\n\n micro avg 0.79 0.79 0.79 13894\n macro avg 0.79 0.80 0.79 13894\nweighted avg 0.79 0.79 0.79 13894\n"}}
test_panx_dataset-en_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 89.29884032114185, "recall": 88.65037194473963, "precision": 89.95686556434221, "summary": " precision recall f1-score support\n\n entity 0.90 0.89 0.89 14115\n\n micro avg 0.90 0.89 0.89 14115\n macro avg 0.90 0.89 0.89 14115\nweighted avg 0.90 0.89 0.89 14115\n"}, "test": {"f1": 89.26135539108982, "recall": 88.54181661148696, "precision": 89.9926847110461, "summary": " precision recall f1-score support\n\n entity 0.90 0.89 0.89 13894\n\n micro avg 0.90 0.89 0.89 13894\n macro avg 0.90 0.89 0.89 13894\nweighted avg 0.90 0.89 0.89 13894\n"}}
test_wnut2017.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 57.63888888888889, "recall": 49.641148325358856, "precision": 68.70860927152319, "summary": " precision recall f1-score support\n\n corporation 0.00 0.00 0.00 34\n group 0.04 0.03 0.03 39\n location 0.50 0.22 0.30 74\n person 0.79 0.72 0.75 470\n product 0.62 0.28 0.39 114\n work of art 0.44 0.27 0.33 105\n\n micro avg 0.69 0.50 0.58 836\n macro avg 0.40 0.25 0.30 836\nweighted avg 0.63 0.50 0.55 836\n"}, "test": {"f1": 49.55555555555556, "recall": 41.41132776230269, "precision": 61.68741355463347, "summary": " precision recall f1-score support\n\n corporation 0.40 0.03 0.06 66\n group 0.50 0.11 0.18 165\n location 0.61 0.43 0.51 150\n person 0.67 0.73 0.70 428\n product 0.23 0.08 0.12 127\n work of art 0.57 0.28 0.38 141\n\n micro avg 0.62 0.41 0.50 1077\n macro avg 0.50 0.28 0.32 1077\nweighted avg 0.56 0.41 0.44 1077\n"}}
test_wnut2017_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 64.85734168406402, "recall": 55.74162679425837, "precision": 77.53743760399334, "summary": " precision recall f1-score support\n\n entity 0.78 0.56 0.65 836\n\n micro avg 0.78 0.56 0.65 836\n macro avg 0.78 0.56 0.65 836\nweighted avg 0.78 0.56 0.65 836\n"}, "test": {"f1": 55.839822024471644, "recall": 46.61095636025998, "precision": 69.62552011095701, "summary": " precision recall f1-score support\n\n entity 0.70 0.47 0.56 1077\n\n micro avg 0.70 0.47 0.56 1077\n macro avg 0.70 0.47 0.56 1077\nweighted avg 0.70 0.47 0.56 1077\n"}}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "name_or_path": "xlm-roberta-base"}