asahi417 commited on
Commit
3eb32c8
1 Parent(s): 961a8e6
config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "xlm-roberta-base",
3
+ "architectures": [
4
+ "XLMRobertaForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "B-organization",
15
+ "1": "I-organization",
16
+ "2": "O",
17
+ "3": "B-location",
18
+ "4": "I-location",
19
+ "5": "B-person",
20
+ "6": "I-person"
21
+ },
22
+ "initializer_range": 0.02,
23
+ "intermediate_size": 3072,
24
+ "label2id": {
25
+ "B-location": 3,
26
+ "B-organization": 0,
27
+ "B-person": 5,
28
+ "I-location": 4,
29
+ "I-organization": 1,
30
+ "I-person": 6,
31
+ "O": 2
32
+ },
33
+ "layer_norm_eps": 1e-05,
34
+ "max_position_embeddings": 514,
35
+ "model_type": "xlm-roberta",
36
+ "num_attention_heads": 12,
37
+ "num_hidden_layers": 12,
38
+ "output_past": true,
39
+ "pad_token_id": 1,
40
+ "type_vocab_size": 1,
41
+ "vocab_size": 250002
42
+ }
parameter.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dataset": ["panx_dataset/en"], "transformers_model": "xlm-roberta-base", "random_seed": 1234, "lr": 1e-05, "total_step": 13000, "warmup_step": 700, "weight_decay": 1e-07, "batch_size": 16, "max_seq_length": 128, "fp16": false, "max_grad_norm": 1.0, "lower_case": false}
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbfe9b7f5e3969752f64761d448d990498d01bb33ffa8f9740f501932c1732e4
3
+ size 1109919359
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": "<mask>"}
test_bc5cdr_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}, "test": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}}
test_bionlp2004_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}}
test_conll2003_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 69.75833900612662, "recall": 81.93084149510294, "precision": 60.73492369239888, "summary": " precision recall f1-score support\n\n entity 0.61 0.82 0.70 5003\n\n micro avg 0.61 0.82 0.70 5003\n macro avg 0.61 0.82 0.70 5003\nweighted avg 0.61 0.82 0.70 5003\n"}, "test": {"f1": 71.84055031307875, "recall": 82.59987832082741, "precision": 63.56117353308365, "summary": " precision recall f1-score support\n\n entity 0.64 0.83 0.72 4931\n\n micro avg 0.64 0.83 0.72 4931\n macro avg 0.64 0.83 0.72 4931\nweighted avg 0.64 0.83 0.72 4931\n"}}
test_fin_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 11.45374449339207, "recall": 15.476190476190476, "precision": 9.090909090909092, "summary": " precision recall f1-score support\n\n entity 0.09 0.15 0.11 252\n\n micro avg 0.09 0.15 0.11 252\n macro avg 0.09 0.15 0.11 252\nweighted avg 0.09 0.15 0.11 252\n"}}
test_ontonotes5_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 28.662420382165603, "recall": 61.581348200709584, "precision": 18.677940046118373, "summary": " precision recall f1-score support\n\n entity 0.19 0.62 0.29 3946\n\n micro avg 0.19 0.62 0.29 3946\n macro avg 0.19 0.62 0.29 3946\nweighted avg 0.19 0.62 0.29 3946\n"}, "test": {"f1": 30.20544142143254, "recall": 61.83379641323567, "precision": 19.983673469387757, "summary": " precision recall f1-score support\n\n entity 0.20 0.62 0.30 3959\n\n micro avg 0.20 0.62 0.30 3959\n macro avg 0.20 0.62 0.30 3959\nweighted avg 0.20 0.62 0.30 3959\n"}}
test_panx_dataset-ar.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 44.83532934131736, "recall": 47.84769681370374, "precision": 42.179798137860885, "summary": " precision recall f1-score support\n\n location 0.31 0.35 0.33 3856\norganization 0.31 0.45 0.37 3596\n person 0.76 0.64 0.69 3815\n\n micro avg 0.42 0.48 0.45 11267\n macro avg 0.46 0.48 0.46 11267\nweighted avg 0.46 0.48 0.46 11267\n"}, "test": {"f1": 44.44628853574541, "recall": 47.5708322231104, "precision": 41.70689923687899, "summary": " precision recall f1-score support\n\n location 0.31 0.36 0.33 3780\norganization 0.31 0.44 0.36 3629\n person 0.74 0.62 0.68 3850\n\n micro avg 0.42 0.48 0.44 11259\n macro avg 0.45 0.47 0.46 11259\nweighted avg 0.46 0.48 0.46 11259\n"}}
test_panx_dataset-en.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 83.47069757654401, "recall": 84.3074743181013, "precision": 82.65036810668148, "summary": " precision recall f1-score support\n\n location 0.85 0.87 0.86 4803\norganization 0.75 0.76 0.75 4677\n person 0.89 0.90 0.89 4635\n\n micro avg 0.83 0.84 0.83 14115\n macro avg 0.83 0.84 0.83 14115\nweighted avg 0.83 0.84 0.83 14115\n"}, "test": {"f1": 82.78416984290955, "recall": 83.63322297394559, "precision": 81.95218280555751, "summary": " precision recall f1-score support\n\n location 0.83 0.86 0.84 4633\norganization 0.75 0.75 0.75 4744\n person 0.88 0.91 0.89 4517\n\n micro avg 0.82 0.84 0.83 13894\n macro avg 0.82 0.84 0.83 13894\nweighted avg 0.82 0.84 0.83 13894\n"}}
test_panx_dataset-en_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 92.57296304148117, "recall": 92.80906836698549, "precision": 92.33805596673011, "summary": " precision recall f1-score support\n\n entity 0.92 0.93 0.93 14115\n\n micro avg 0.92 0.93 0.93 14115\n macro avg 0.92 0.93 0.93 14115\nweighted avg 0.92 0.93 0.93 14115\n"}, "test": {"f1": 92.58686981206655, "recall": 92.72347776018425, "precision": 92.45066379619664, "summary": " precision recall f1-score support\n\n entity 0.92 0.93 0.93 13894\n\n micro avg 0.92 0.93 0.93 13894\n macro avg 0.92 0.93 0.93 13894\nweighted avg 0.92 0.93 0.93 13894\n"}}
test_panx_dataset-es.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 73.24065008811435, "recall": 76.21026894865525, "precision": 70.49378062570675, "summary": " precision recall f1-score support\n\n location 0.76 0.72 0.74 4567\norganization 0.53 0.74 0.62 3737\n person 0.89 0.82 0.86 3966\n\n micro avg 0.70 0.76 0.73 12270\n macro avg 0.73 0.76 0.74 12270\nweighted avg 0.73 0.76 0.74 12270\n"}, "test": {"f1": 73.828125, "recall": 77.07993474714519, "precision": 70.83958020989505, "summary": " precision recall f1-score support\n\n location 0.78 0.73 0.76 4725\norganization 0.52 0.75 0.61 3576\n person 0.89 0.83 0.86 3959\n\n micro avg 0.71 0.77 0.74 12260\n macro avg 0.73 0.77 0.74 12260\nweighted avg 0.74 0.77 0.75 12260\n"}}
test_panx_dataset-ja.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 38.5978059130556, "recall": 43.02169732522678, "precision": 34.99889384027053, "summary": " precision recall f1-score support\n\n location 0.43 0.62 0.51 19595\norganization 0.24 0.37 0.29 16328\n person 0.41 0.26 0.32 15558\n\n micro avg 0.35 0.43 0.39 51481\n macro avg 0.36 0.41 0.37 51481\nweighted avg 0.36 0.43 0.38 51481\n"}, "test": {"f1": 38.5978059130556, "recall": 43.02169732522678, "precision": 34.99889384027053, "summary": " precision recall f1-score support\n\n location 0.43 0.62 0.51 19595\norganization 0.24 0.37 0.29 16328\n person 0.41 0.26 0.32 15558\n\n micro avg 0.35 0.43 0.39 51481\n macro avg 0.36 0.41 0.37 51481\nweighted avg 0.36 0.43 0.38 51481\n"}}
test_panx_dataset-ko.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 51.73495194739505, "recall": 52.69629731400701, "precision": 50.80805404689362, "summary": " precision recall f1-score support\n\n location 0.59 0.56 0.58 5997\norganization 0.35 0.47 0.40 4459\n person 0.66 0.53 0.59 4101\n\n micro avg 0.51 0.53 0.52 14557\n macro avg 0.53 0.52 0.52 14557\nweighted avg 0.54 0.53 0.53 14557\n"}, "test": {"f1": 50.36039389529965, "recall": 51.59120848644526, "precision": 49.186938127974614, "summary": " precision recall f1-score support\n\n location 0.57 0.56 0.56 5855\norganization 0.33 0.47 0.39 4319\n person 0.65 0.51 0.57 4249\n\n micro avg 0.49 0.52 0.50 14423\n macro avg 0.52 0.51 0.51 14423\nweighted avg 0.52 0.52 0.51 14423\n"}}
test_panx_dataset-ru.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 65.6405201501308, "recall": 70.18809794065186, "precision": 61.64637185786512, "summary": " precision recall f1-score support\n\n location 0.56 0.81 0.66 4852\norganization 0.61 0.68 0.64 3892\n person 0.77 0.57 0.66 3590\n\n micro avg 0.62 0.70 0.66 12334\n macro avg 0.65 0.69 0.66 12334\nweighted avg 0.64 0.70 0.66 12334\n"}, "test": {"f1": 65.67015445939212, "recall": 70.35394596370206, "precision": 61.571079488285186, "summary": " precision recall f1-score support\n\n location 0.55 0.81 0.66 4560\norganization 0.61 0.68 0.64 4074\n person 0.77 0.59 0.67 3543\n\n micro avg 0.62 0.70 0.66 12177\n macro avg 0.65 0.69 0.66 12177\nweighted avg 0.64 0.70 0.66 12177\n"}}
test_wnut2017_span.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"valid": {"f1": 48.82051282051282, "recall": 43.75, "precision": 55.22041763341067, "summary": " precision recall f1-score support\n\n entity 0.55 0.44 0.49 544\n\n micro avg 0.55 0.44 0.49 544\n macro avg 0.55 0.44 0.49 544\nweighted avg 0.55 0.44 0.49 544\n"}, "test": {"f1": 45.3307392996109, "recall": 40.31141868512111, "precision": 51.77777777777778, "summary": " precision recall f1-score support\n\n entity 0.52 0.40 0.45 578\n\n micro avg 0.52 0.40 0.45 578\n macro avg 0.52 0.40 0.45 578\nweighted avg 0.52 0.40 0.45 578\n"}}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "name_or_path": "xlm-roberta-base"}