willemjan committed on
Commit
706c0f3
1 Parent(s): 59422c3

Dutch_1800-2000

Browse files
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertForMaskedLM"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "directionality": "bidi",
7
+ "finetuning_task": "ner",
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 3072,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "bert",
16
+ "num_attention_heads": 12,
17
+ "num_hidden_layers": 12,
18
+ "num_labels": 20,
19
+ "output_attentions": false,
20
+ "output_hidden_states": false,
21
+ "pad_token_id": 0,
22
+ "pooler_fc_size": 768,
23
+ "pooler_num_attention_heads": 12,
24
+ "pooler_num_fc_layers": 3,
25
+ "pooler_size_per_head": 128,
26
+ "pooler_type": "first_token_transform",
27
+ "pruned_heads": {},
28
+ "torchscript": false,
29
+ "type_vocab_size": 2,
30
+ "vocab_size": 119547
31
+ }
eval_results.txt ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ precision recall f1-score support
2
+
3
+ DAT 0.0000 0.0000 0.0000 0
4
+ DOM 0.0000 0.0000 0.0000 0
5
+ LOC 0.8797 0.4209 0.5693 278
6
+ MISC 0.0000 0.0000 0.0000 423
7
+ ORG 0.5939 0.3111 0.4083 315
8
+ PER 0.7939 0.5084 0.6199 356
9
+ QUA 0.0000 0.0000 0.0000 0
10
+ REF 0.0000 0.0000 0.0000 0
11
+ SEP] 0.0000 0.0000 0.0000 0
12
+
13
+ micro avg 0.4526 0.2886 0.3525 1372
14
+ macro avg 0.2519 0.1378 0.1775 1372
15
+ weighted avg 0.5206 0.2886 0.3700 1372
model_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bert_model": "bert-base-multilingual-cased", "do_lower": false, "max_seq_length": 180, "num_labels": 20, "label_map": {"1": "O", "2": "B-PER", "3": "I-PER", "4": "B-ORG", "5": "I-ORG", "6": "B-LOC", "7": "I-LOC", "8": "B-DAT", "9": "I-DAT", "10": "B-REF", "11": "I-REF", "12": "B-DOM", "13": "I-DOM", "14": "B-QUA", "15": "I-QUA", "16": "B-MISC", "17": "I-MISC", "18": "[CLS]", "19": "[SEP]"}}
nl2.txt ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ precision recall f1-score support
2
+
3
+ DAT 0.0000 0.0000 0.0000 0
4
+ DOM 0.0000 0.0000 0.0000 0
5
+ LOC 0.8797 0.4209 0.5693 278
6
+ MISC 0.0000 0.0000 0.0000 423
7
+ ORG 0.5939 0.3111 0.4083 315
8
+ PER 0.7939 0.5084 0.6199 356
9
+ QUA 0.0000 0.0000 0.0000 0
10
+ REF 0.0000 0.0000 0.0000 0
11
+ SEP] 0.0000 0.0000 0.0000 0
12
+
13
+ micro avg 0.4526 0.2886 0.3525 1372
14
+ macro avg 0.2519 0.1378 0.1775 1372
15
+ weighted avg 0.5206 0.2886 0.3700 1372
16
+
17
+ 01/13/2022 01:22:06 - INFO - __main__ - ***** Eval results *****
18
+ 01/13/2022 01:22:06 - INFO - __main__ -
19
+ precision recall f1-score support
20
+
21
+ DAT 0.0000 0.0000 0.0000 0
22
+ DOM 0.0000 0.0000 0.0000 0
23
+ LOC 0.8797 0.4209 0.5693 278
24
+ MISC 0.0000 0.0000 0.0000 423
25
+ ORG 0.5939 0.3111 0.4083 315
26
+ PER 0.7939 0.5084 0.6199 356
27
+ QUA 0.0000 0.0000 0.0000 0
28
+ REF 0.0000 0.0000 0.0000 0
29
+ SEP] 0.0000 0.0000 0.0000 0
30
+
31
+ micro avg 0.4526 0.2886 0.3525 1372
32
+ macro avg 0.2519 0.1378 0.1775 1372
33
+ weighted avg 0.5206 0.2886 0.3700 1372
34
+
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b7f34681a842c956740b5ad6f6c28f7d2889aaab21cc27a05da9beb7c670ed0
3
+ size 711525557
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "max_len": 512, "init_inputs": []}
vocab.txt ADDED
The diff for this file is too large to render. See raw diff