creat89 committed on
Commit
3f5242e
0 Parent(s):

Upload model

Browse files

.gitattributes ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
5
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.model filter=lfs diff=lfs merge=lfs -text
12
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
13
+ *.onnx filter=lfs diff=lfs merge=lfs -text
14
+ *.ot filter=lfs diff=lfs merge=lfs -text
15
+ *.parquet filter=lfs diff=lfs merge=lfs -text
16
+ *.pb filter=lfs diff=lfs merge=lfs -text
17
+ *.pt filter=lfs diff=lfs merge=lfs -text
18
+ *.pth filter=lfs diff=lfs merge=lfs -text
19
+ *.rar filter=lfs diff=lfs merge=lfs -text
20
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
21
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
22
+ *.tflite filter=lfs diff=lfs merge=lfs -text
23
+ *.tgz filter=lfs diff=lfs merge=lfs -text
24
+ *.xz filter=lfs diff=lfs merge=lfs -text
25
+ *.zip filter=lfs diff=lfs merge=lfs -text
26
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
27
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
config.json ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BERT_model_multidata"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "directionality": "bidi",
7
+ "finetuning_task": "2021ru_da-IOBES-S__t_EC__",
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "LABEL_0",
13
+ "1": "LABEL_1",
14
+ "2": "LABEL_2",
15
+ "3": "LABEL_3",
16
+ "4": "LABEL_4",
17
+ "5": "LABEL_5",
18
+ "6": "LABEL_6",
19
+ "7": "LABEL_7",
20
+ "8": "LABEL_8",
21
+ "9": "LABEL_9",
22
+ "10": "LABEL_10",
23
+ "11": "LABEL_11",
24
+ "12": "LABEL_12",
25
+ "13": "LABEL_13",
26
+ "14": "LABEL_14",
27
+ "15": "LABEL_15",
28
+ "16": "LABEL_16",
29
+ "17": "LABEL_17",
30
+ "18": "LABEL_18",
31
+ "19": "LABEL_19",
32
+ "20": "LABEL_20",
33
+ "21": "LABEL_21",
34
+ "22": "LABEL_22",
35
+ "23": "LABEL_23",
36
+ "24": "LABEL_24",
37
+ "25": "LABEL_25",
38
+ "26": "LABEL_26",
39
+ "27": "LABEL_27",
40
+ "28": "LABEL_28",
41
+ "29": "LABEL_29",
42
+ "30": "LABEL_30",
43
+ "31": "LABEL_31"
44
+ },
45
+ "initializer_range": 0.02,
46
+ "intermediate_size": 3072,
47
+ "label2id": {
48
+ "B-EVT": 20,
49
+ "B-GEOPOLIT": 28,
50
+ "B-LOC": 8,
51
+ "B-MEDIA": 24,
52
+ "B-ORG": 12,
53
+ "B-PER": 4,
54
+ "B-PRO": 16,
55
+ "E-EVT": 22,
56
+ "E-GEOPOLIT": 30,
57
+ "E-LOC": 10,
58
+ "E-MEDIA": 26,
59
+ "E-ORG": 14,
60
+ "E-PER": 6,
61
+ "E-PRO": 18,
62
+ "I-EVT": 21,
63
+ "I-GEOPOLIT": 29,
64
+ "I-LOC": 9,
65
+ "I-MEDIA": 25,
66
+ "I-ORG": 13,
67
+ "I-PER": 5,
68
+ "I-PRO": 17,
69
+ "O": 1,
70
+ "S-EVT": 23,
71
+ "S-GEOPOLIT": 31,
72
+ "S-LOC": 11,
73
+ "S-MEDIA": 27,
74
+ "S-ORG": 15,
75
+ "S-PER": 7,
76
+ "S-PRO": 19,
77
+ "[CLS]": 2,
78
+ "[SEP]": 3
79
+ },
80
+ "layer_norm_eps": 1e-12,
81
+ "max_position_embeddings": 512,
82
+ "model_type": "bert",
83
+ "num_attention_heads": 12,
84
+ "num_hidden_layers": 12,
85
+ "output_past": true,
86
+ "pad_token_id": 0,
87
+ "pooler_fc_size": 768,
88
+ "pooler_num_attention_heads": 12,
89
+ "pooler_num_fc_layers": 3,
90
+ "pooler_size_per_head": 128,
91
+ "pooler_type": "first_token_transform",
92
+ "task_specific_params": {
93
+ "bert_hidden_size": 768,
94
+ "biaffine": false,
95
+ "boundaries_labels": null,
96
+ "crf": true,
97
+ "md_model": true,
98
+ "md_number": 4,
99
+ "predict_boundaries": false,
100
+ "predict_masked": true,
101
+ "type_crf_constraints": "BIOES"
102
+ },
103
+ "type_vocab_size": 2,
104
+ "vocab_size": 119570
105
+ }
mapping.pkl ADDED
Binary file
params-2021ru_da-IOBES-S__t_EC__.txt ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 12
2
+ file_extension: txt
3
+ experiment_name: 2021ru_da-IOBES-S__t_EC__
4
+ tags2use: NER_IOBES
5
+ special_labesl: True
6
+ force_size: False
7
+ train_file: train_*
8
+ masking_percentage: 0.25
9
+ seed: 12
10
+ epochs: 20
11
+ early_stop: 2
12
+ separator:
13
+ test_file: test
14
+ dev_file: dev_*
15
+ crf: True
16
+ uppercase: False
17
+ lr: 2e-05
18
+ epsilon: 1e-08
19
+ bert_model: /home/lcabrera/BERT_Models/rubert-base-cased/
20
+ mask_entities: False
21
+ train_batch_size: 8
22
+ comment_line: -DOCSTART
23
+ sequence_size: 128
24
+ multi_gpu: False
25
+ fullwords_mask: None
26
+ redundant_uppercase: None
27
+ bert_hidden_size: 768
28
+ no_dev: False
29
+ multidata_model: Daume
30
+ training_datasets: ['train_0_wikiann_ru', 'train_1_final_ru', 'train_2_factrueval', 'train_3_collection5']
31
+ predict_boundaries: False
32
+ biaffine: False
33
+ uppercase_percentahe: 0.0
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c169cef73b7de59bdfe4154c74d5aa7e70b1a683a1676ebea255b28122aa86bf
3
+ size 1090436421
vocab.txt ADDED
The diff for this file is too large to render. See raw diff