elshehawy committed on
Commit
5c8c0da
1 Parent(s): 4ecda2f

Training in progress, epoch 1

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nlpaueb/sec-bert-shape",
3
+ "architectures": [
4
+ "BertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "id2label": {
13
+ "0": "O",
14
+ "1": "B-PER",
15
+ "2": "I-PER",
16
+ "3": "B-ORG",
17
+ "4": "I-ORG",
18
+ "5": "B-LOC",
19
+ "6": "I-LOC",
20
+ "7": "B-MISC",
21
+ "8": "I-MISC"
22
+ },
23
+ "initializer_range": 0.02,
24
+ "intermediate_size": 3072,
25
+ "label2id": {
26
+ "B-LOC": 5,
27
+ "B-MISC": 7,
28
+ "B-ORG": 3,
29
+ "B-PER": 1,
30
+ "I-LOC": 6,
31
+ "I-MISC": 8,
32
+ "I-ORG": 4,
33
+ "I-PER": 2,
34
+ "O": 0
35
+ },
36
+ "layer_norm_eps": 1e-12,
37
+ "max_position_embeddings": 512,
38
+ "model_type": "bert",
39
+ "num_attention_heads": 12,
40
+ "num_hidden_layers": 12,
41
+ "pad_token_id": 0,
42
+ "position_embedding_type": "absolute",
43
+ "torch_dtype": "float32",
44
+ "transformers_version": "4.30.2",
45
+ "type_vocab_size": 2,
46
+ "use_cache": true,
47
+ "vocab_size": 30000
48
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80f97c965846c5a3dda22fc0d11c511d086563521adf79304e6d4eb8fd5f4ea1
3
+ size 434061105
runs/Sep11_15-54-35_nyf2wftun0/events.out.tfevents.1694447696.nyf2wftun0.655.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28726b64c62788689313ca71131e689066d362aa57a834fad780827bb1d61131
3
+ size 4383
runs/Sep11_15-54-35_nyf2wftun0/events.out.tfevents.1694447854.nyf2wftun0.655.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb91420ecde17cf51d99ba99dadf55eb6875dae4fb7e661ebfafd71409703cc8
3
+ size 5358
special_tokens_map.json ADDED
@@ -0,0 +1,224 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "[NUM]",
4
+ "[X]",
5
+ "[X.X]",
6
+ "[X.XX]",
7
+ "[X.XXX]",
8
+ "[X.XXXX]",
9
+ "[X.XXXXX]",
10
+ "[X.XXXXXX]",
11
+ "[X.XXXXXXX]",
12
+ "[X.XXXXXXXX]",
13
+ "[X.XXXXXXXXX]",
14
+ "[X,XXX.X]",
15
+ "[X,XXX.XX]",
16
+ "[X,XXX.XXX]",
17
+ "[X,XXX,XXX]",
18
+ "[X,XXX,XXX.X]",
19
+ "[X,XXX,XXX.XX]",
20
+ "[X,XXX,XXX.XXX]",
21
+ "[X,XXX,XXX,XXX]",
22
+ "[X,XXX,XXX,XXX.X]",
23
+ "[X,XXX,XXX,XXX.XX]",
24
+ "[X,XXX,XXX,XXX.XXX]",
25
+ "[X,XXX,XXX,XXX,XXX]",
26
+ "[X,XXX,XXX,XXX,XXX.X]",
27
+ "[X,XXX,XXX,XXX,XXX.XX]",
28
+ "[X,XXX,XXX,XXX,XXX.XXX]",
29
+ "[XX.X]",
30
+ "[XX.XX]",
31
+ "[XX.XXX]",
32
+ "[XX.XXXX]",
33
+ "[XX.XXXXX]",
34
+ "[XX.XXXXXX]",
35
+ "[XX.XXXXXXX]",
36
+ "[XX.XXXXXXXX]",
37
+ "[XX.XXXXXXXXX]",
38
+ "[XX,XXX.X]",
39
+ "[XX,XXX.XX]",
40
+ "[XX,XXX.XXX]",
41
+ "[XX,XXX,XXX]",
42
+ "[XX,XXX,XXX.X]",
43
+ "[XX,XXX,XXX.XX]",
44
+ "[XX,XXX,XXX.XXX]",
45
+ "[XX,XXX,XXX,XXX]",
46
+ "[XX,XXX,XXX,XXX.X]",
47
+ "[XX,XXX,XXX,XXX.XX]",
48
+ "[XX,XXX,XXX,XXX.XXX]",
49
+ "[XX,XXX,XXX,XXX,XXX]",
50
+ "[XX,XXX,XXX,XXX,XXX.X]",
51
+ "[XX,XXX,XXX,XXX,XXX.XX]",
52
+ "[XX,XXX,XXX,XXX,XXX.XXX]",
53
+ "[XXX]",
54
+ "[XXX.X]",
55
+ "[XXX.XX]",
56
+ "[XXX.XXX]",
57
+ "[XXX.XXXX]",
58
+ "[XXX.XXXXX]",
59
+ "[XXX.XXXXXX]",
60
+ "[XXX.XXXXXXX]",
61
+ "[XXX.XXXXXXXX]",
62
+ "[XXX.XXXXXXXXX]",
63
+ "[XXX,XXX.X]",
64
+ "[XXX,XXX.XX]",
65
+ "[XXX,XXX.XXX]",
66
+ "[XXX,XXX,XXX]",
67
+ "[XXX,XXX,XXX.X]",
68
+ "[XXX,XXX,XXX.XX]",
69
+ "[XXX,XXX,XXX.XXX]",
70
+ "[XXX,XXX,XXX,XXX]",
71
+ "[XXX,XXX,XXX,XXX.X]",
72
+ "[XXX,XXX,XXX,XXX.XX]",
73
+ "[XXX,XXX,XXX,XXX.XXX]",
74
+ "[XXX,XXX,XXX,XXX,XXX]",
75
+ "[XXX,XXX,XXX,XXX,XXX.X]",
76
+ "[XXX,XXX,XXX,XXX,XXX.XX]",
77
+ "[XXX,XXX,XXX,XXX,XXX.XXX]",
78
+ "[XXXX.X]",
79
+ "[XXXX.XX]",
80
+ "[XXXX.XXX]",
81
+ "[XXXXX]",
82
+ "[XXXXX.X]",
83
+ "[XXXXX.XX]",
84
+ "[XXXXX.XXX]",
85
+ "[XXXXXX]",
86
+ "[XXXXXX.X]",
87
+ "[XXXXXX.XX]",
88
+ "[XXXXXX.XXX]",
89
+ "[XXXXXXX]",
90
+ "[XXXXXXX.X]",
91
+ "[XXXXXXX.XX]",
92
+ "[XXXXXXX.XXX]",
93
+ "[XXXXXXXX]",
94
+ "[XXXXXXXX.X]",
95
+ "[XXXXXXXX.XX]",
96
+ "[XXXXXXXX.XXX]",
97
+ "[XXXXXXXXX]",
98
+ "[XXXXXXXXX.X]",
99
+ "[XXXXXXXXX.XX]",
100
+ "[XXXXXXXXX.XXX]",
101
+ "[XXXXXXXXXX]",
102
+ "[XXXXXXXXXX.X]",
103
+ "[XXXXXXXXXX.XX]",
104
+ "[XXXXXXXXXX.XXX]",
105
+ "[X,X]",
106
+ "[X,XX]",
107
+ "[X,XXX]",
108
+ "[X,XXXX]",
109
+ "[X,XXXXX]",
110
+ "[X,XXXXXX]",
111
+ "[X,XXXXXXX]",
112
+ "[X,XXXXXXXX]",
113
+ "[X,XXXXXXXXX]",
114
+ "[X.XXX,X]",
115
+ "[X.XXX,XX]",
116
+ "[X.XXX,XXX]",
117
+ "[X.XXX.XXX]",
118
+ "[X.XXX.XXX,X]",
119
+ "[X.XXX.XXX,XX]",
120
+ "[X.XXX.XXX,XXX]",
121
+ "[X.XXX.XXX.XXX]",
122
+ "[X.XXX.XXX.XXX,X]",
123
+ "[X.XXX.XXX.XXX,XX]",
124
+ "[X.XXX.XXX.XXX,XXX]",
125
+ "[X.XXX.XXX.XXX.XXX]",
126
+ "[X.XXX.XXX.XXX.XXX,X]",
127
+ "[X.XXX.XXX.XXX.XXX,XX]",
128
+ "[X.XXX.XXX.XXX.XXX,XXX]",
129
+ "[XX]",
130
+ "[XX,X]",
131
+ "[XX,XX]",
132
+ "[XX,XXX]",
133
+ "[XX,XXXX]",
134
+ "[XX,XXXXX]",
135
+ "[XX,XXXXXX]",
136
+ "[XX,XXXXXXX]",
137
+ "[XX,XXXXXXXX]",
138
+ "[XX,XXXXXXXXX]",
139
+ "[XX.XXX,X]",
140
+ "[XX.XXX,XX]",
141
+ "[XX.XXX,XXX]",
142
+ "[XX.XXX.XXX]",
143
+ "[XX.XXX.XXX,X]",
144
+ "[XX.XXX.XXX,XX]",
145
+ "[XX.XXX.XXX,XXX]",
146
+ "[XX.XXX.XXX.XXX]",
147
+ "[XX.XXX.XXX.XXX,X]",
148
+ "[XX.XXX.XXX.XXX,XX]",
149
+ "[XX.XXX.XXX.XXX,XXX]",
150
+ "[XX.XXX.XXX.XXX.XXX]",
151
+ "[XX.XXX.XXX.XXX.XXX,X]",
152
+ "[XX.XXX.XXX.XXX.XXX,XX]",
153
+ "[XX.XXX.XXX.XXX.XXX,XXX]",
154
+ "[XXX,X]",
155
+ "[XXX,XX]",
156
+ "[XXX,XXX]",
157
+ "[XXX,XXXX]",
158
+ "[XXX,XXXXX]",
159
+ "[XXX,XXXXXX]",
160
+ "[XXX,XXXXXXX]",
161
+ "[XXX,XXXXXXXX]",
162
+ "[XXX,XXXXXXXXX]",
163
+ "[XXX.XXX,X]",
164
+ "[XXX.XXX,XX]",
165
+ "[XXX.XXX,XXX]",
166
+ "[XXX.XXX.XXX]",
167
+ "[XXX.XXX.XXX,X]",
168
+ "[XXX.XXX.XXX,XX]",
169
+ "[XXX.XXX.XXX,XXX]",
170
+ "[XXX.XXX.XXX.XXX]",
171
+ "[XXX.XXX.XXX.XXX,X]",
172
+ "[XXX.XXX.XXX.XXX,XX]",
173
+ "[XXX.XXX.XXX.XXX,XXX]",
174
+ "[XXX.XXX.XXX.XXX.XXX]",
175
+ "[XXX.XXX.XXX.XXX.XXX,X]",
176
+ "[XXX.XXX.XXX.XXX.XXX,XX]",
177
+ "[XXX.XXX.XXX.XXX.XXX,XXX]",
178
+ "[XXXX]",
179
+ "[XXXX,X]",
180
+ "[XXXX,XX]",
181
+ "[XXXX,XXX]",
182
+ "[XXXXX,X]",
183
+ "[XXXXX,XX]",
184
+ "[XXXXX,XXX]",
185
+ "[XXXXXX,X]",
186
+ "[XXXXXX,XX]",
187
+ "[XXXXXX,XXX]",
188
+ "[XXXXXXX,X]",
189
+ "[XXXXXXX,XX]",
190
+ "[XXXXXXX,XXX]",
191
+ "[XXXXXXXX,X]",
192
+ "[XXXXXXXX,XX]",
193
+ "[XXXXXXXX,XXX]",
194
+ "[XXXXXXXXX,X]",
195
+ "[XXXXXXXXX,XX]",
196
+ "[XXXXXXXXX,XXX]",
197
+ "[XXXXXXXXXX,X]",
198
+ "[XXXXXXXXXX,XX]",
199
+ "[XXXXXXXXXX,XXX]",
200
+ "[.X]",
201
+ "[.XX]",
202
+ "[.XXX]",
203
+ "[.XXXX]",
204
+ "[.XXXXX]",
205
+ "[.XXXXXX]",
206
+ "[.XXXXXXX]",
207
+ "[.XXXXXXXX]",
208
+ "[.XXXXXXXXX]",
209
+ "[,X]",
210
+ "[,XX]",
211
+ "[,XXX]",
212
+ "[,XXXX]",
213
+ "[,XXXXX]",
214
+ "[,XXXXXX]",
215
+ "[,XXXXXXX]",
216
+ "[,XXXXXXXX]",
217
+ "[,XXXXXXXXX]"
218
+ ],
219
+ "cls_token": "[CLS]",
220
+ "mask_token": "[MASK]",
221
+ "pad_token": "[PAD]",
222
+ "sep_token": "[SEP]",
223
+ "unk_token": "[UNK]"
224
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,232 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "[NUM]",
4
+ "[X]",
5
+ "[X.X]",
6
+ "[X.XX]",
7
+ "[X.XXX]",
8
+ "[X.XXXX]",
9
+ "[X.XXXXX]",
10
+ "[X.XXXXXX]",
11
+ "[X.XXXXXXX]",
12
+ "[X.XXXXXXXX]",
13
+ "[X.XXXXXXXXX]",
14
+ "[X,XXX.X]",
15
+ "[X,XXX.XX]",
16
+ "[X,XXX.XXX]",
17
+ "[X,XXX,XXX]",
18
+ "[X,XXX,XXX.X]",
19
+ "[X,XXX,XXX.XX]",
20
+ "[X,XXX,XXX.XXX]",
21
+ "[X,XXX,XXX,XXX]",
22
+ "[X,XXX,XXX,XXX.X]",
23
+ "[X,XXX,XXX,XXX.XX]",
24
+ "[X,XXX,XXX,XXX.XXX]",
25
+ "[X,XXX,XXX,XXX,XXX]",
26
+ "[X,XXX,XXX,XXX,XXX.X]",
27
+ "[X,XXX,XXX,XXX,XXX.XX]",
28
+ "[X,XXX,XXX,XXX,XXX.XXX]",
29
+ "[XX.X]",
30
+ "[XX.XX]",
31
+ "[XX.XXX]",
32
+ "[XX.XXXX]",
33
+ "[XX.XXXXX]",
34
+ "[XX.XXXXXX]",
35
+ "[XX.XXXXXXX]",
36
+ "[XX.XXXXXXXX]",
37
+ "[XX.XXXXXXXXX]",
38
+ "[XX,XXX.X]",
39
+ "[XX,XXX.XX]",
40
+ "[XX,XXX.XXX]",
41
+ "[XX,XXX,XXX]",
42
+ "[XX,XXX,XXX.X]",
43
+ "[XX,XXX,XXX.XX]",
44
+ "[XX,XXX,XXX.XXX]",
45
+ "[XX,XXX,XXX,XXX]",
46
+ "[XX,XXX,XXX,XXX.X]",
47
+ "[XX,XXX,XXX,XXX.XX]",
48
+ "[XX,XXX,XXX,XXX.XXX]",
49
+ "[XX,XXX,XXX,XXX,XXX]",
50
+ "[XX,XXX,XXX,XXX,XXX.X]",
51
+ "[XX,XXX,XXX,XXX,XXX.XX]",
52
+ "[XX,XXX,XXX,XXX,XXX.XXX]",
53
+ "[XXX]",
54
+ "[XXX.X]",
55
+ "[XXX.XX]",
56
+ "[XXX.XXX]",
57
+ "[XXX.XXXX]",
58
+ "[XXX.XXXXX]",
59
+ "[XXX.XXXXXX]",
60
+ "[XXX.XXXXXXX]",
61
+ "[XXX.XXXXXXXX]",
62
+ "[XXX.XXXXXXXXX]",
63
+ "[XXX,XXX.X]",
64
+ "[XXX,XXX.XX]",
65
+ "[XXX,XXX.XXX]",
66
+ "[XXX,XXX,XXX]",
67
+ "[XXX,XXX,XXX.X]",
68
+ "[XXX,XXX,XXX.XX]",
69
+ "[XXX,XXX,XXX.XXX]",
70
+ "[XXX,XXX,XXX,XXX]",
71
+ "[XXX,XXX,XXX,XXX.X]",
72
+ "[XXX,XXX,XXX,XXX.XX]",
73
+ "[XXX,XXX,XXX,XXX.XXX]",
74
+ "[XXX,XXX,XXX,XXX,XXX]",
75
+ "[XXX,XXX,XXX,XXX,XXX.X]",
76
+ "[XXX,XXX,XXX,XXX,XXX.XX]",
77
+ "[XXX,XXX,XXX,XXX,XXX.XXX]",
78
+ "[XXXX.X]",
79
+ "[XXXX.XX]",
80
+ "[XXXX.XXX]",
81
+ "[XXXXX]",
82
+ "[XXXXX.X]",
83
+ "[XXXXX.XX]",
84
+ "[XXXXX.XXX]",
85
+ "[XXXXXX]",
86
+ "[XXXXXX.X]",
87
+ "[XXXXXX.XX]",
88
+ "[XXXXXX.XXX]",
89
+ "[XXXXXXX]",
90
+ "[XXXXXXX.X]",
91
+ "[XXXXXXX.XX]",
92
+ "[XXXXXXX.XXX]",
93
+ "[XXXXXXXX]",
94
+ "[XXXXXXXX.X]",
95
+ "[XXXXXXXX.XX]",
96
+ "[XXXXXXXX.XXX]",
97
+ "[XXXXXXXXX]",
98
+ "[XXXXXXXXX.X]",
99
+ "[XXXXXXXXX.XX]",
100
+ "[XXXXXXXXX.XXX]",
101
+ "[XXXXXXXXXX]",
102
+ "[XXXXXXXXXX.X]",
103
+ "[XXXXXXXXXX.XX]",
104
+ "[XXXXXXXXXX.XXX]",
105
+ "[X,X]",
106
+ "[X,XX]",
107
+ "[X,XXX]",
108
+ "[X,XXXX]",
109
+ "[X,XXXXX]",
110
+ "[X,XXXXXX]",
111
+ "[X,XXXXXXX]",
112
+ "[X,XXXXXXXX]",
113
+ "[X,XXXXXXXXX]",
114
+ "[X.XXX,X]",
115
+ "[X.XXX,XX]",
116
+ "[X.XXX,XXX]",
117
+ "[X.XXX.XXX]",
118
+ "[X.XXX.XXX,X]",
119
+ "[X.XXX.XXX,XX]",
120
+ "[X.XXX.XXX,XXX]",
121
+ "[X.XXX.XXX.XXX]",
122
+ "[X.XXX.XXX.XXX,X]",
123
+ "[X.XXX.XXX.XXX,XX]",
124
+ "[X.XXX.XXX.XXX,XXX]",
125
+ "[X.XXX.XXX.XXX.XXX]",
126
+ "[X.XXX.XXX.XXX.XXX,X]",
127
+ "[X.XXX.XXX.XXX.XXX,XX]",
128
+ "[X.XXX.XXX.XXX.XXX,XXX]",
129
+ "[XX]",
130
+ "[XX,X]",
131
+ "[XX,XX]",
132
+ "[XX,XXX]",
133
+ "[XX,XXXX]",
134
+ "[XX,XXXXX]",
135
+ "[XX,XXXXXX]",
136
+ "[XX,XXXXXXX]",
137
+ "[XX,XXXXXXXX]",
138
+ "[XX,XXXXXXXXX]",
139
+ "[XX.XXX,X]",
140
+ "[XX.XXX,XX]",
141
+ "[XX.XXX,XXX]",
142
+ "[XX.XXX.XXX]",
143
+ "[XX.XXX.XXX,X]",
144
+ "[XX.XXX.XXX,XX]",
145
+ "[XX.XXX.XXX,XXX]",
146
+ "[XX.XXX.XXX.XXX]",
147
+ "[XX.XXX.XXX.XXX,X]",
148
+ "[XX.XXX.XXX.XXX,XX]",
149
+ "[XX.XXX.XXX.XXX,XXX]",
150
+ "[XX.XXX.XXX.XXX.XXX]",
151
+ "[XX.XXX.XXX.XXX.XXX,X]",
152
+ "[XX.XXX.XXX.XXX.XXX,XX]",
153
+ "[XX.XXX.XXX.XXX.XXX,XXX]",
154
+ "[XXX,X]",
155
+ "[XXX,XX]",
156
+ "[XXX,XXX]",
157
+ "[XXX,XXXX]",
158
+ "[XXX,XXXXX]",
159
+ "[XXX,XXXXXX]",
160
+ "[XXX,XXXXXXX]",
161
+ "[XXX,XXXXXXXX]",
162
+ "[XXX,XXXXXXXXX]",
163
+ "[XXX.XXX,X]",
164
+ "[XXX.XXX,XX]",
165
+ "[XXX.XXX,XXX]",
166
+ "[XXX.XXX.XXX]",
167
+ "[XXX.XXX.XXX,X]",
168
+ "[XXX.XXX.XXX,XX]",
169
+ "[XXX.XXX.XXX,XXX]",
170
+ "[XXX.XXX.XXX.XXX]",
171
+ "[XXX.XXX.XXX.XXX,X]",
172
+ "[XXX.XXX.XXX.XXX,XX]",
173
+ "[XXX.XXX.XXX.XXX,XXX]",
174
+ "[XXX.XXX.XXX.XXX.XXX]",
175
+ "[XXX.XXX.XXX.XXX.XXX,X]",
176
+ "[XXX.XXX.XXX.XXX.XXX,XX]",
177
+ "[XXX.XXX.XXX.XXX.XXX,XXX]",
178
+ "[XXXX]",
179
+ "[XXXX,X]",
180
+ "[XXXX,XX]",
181
+ "[XXXX,XXX]",
182
+ "[XXXXX,X]",
183
+ "[XXXXX,XX]",
184
+ "[XXXXX,XXX]",
185
+ "[XXXXXX,X]",
186
+ "[XXXXXX,XX]",
187
+ "[XXXXXX,XXX]",
188
+ "[XXXXXXX,X]",
189
+ "[XXXXXXX,XX]",
190
+ "[XXXXXXX,XXX]",
191
+ "[XXXXXXXX,X]",
192
+ "[XXXXXXXX,XX]",
193
+ "[XXXXXXXX,XXX]",
194
+ "[XXXXXXXXX,X]",
195
+ "[XXXXXXXXX,XX]",
196
+ "[XXXXXXXXX,XXX]",
197
+ "[XXXXXXXXXX,X]",
198
+ "[XXXXXXXXXX,XX]",
199
+ "[XXXXXXXXXX,XXX]",
200
+ "[.X]",
201
+ "[.XX]",
202
+ "[.XXX]",
203
+ "[.XXXX]",
204
+ "[.XXXXX]",
205
+ "[.XXXXXX]",
206
+ "[.XXXXXXX]",
207
+ "[.XXXXXXXX]",
208
+ "[.XXXXXXXXX]",
209
+ "[,X]",
210
+ "[,XX]",
211
+ "[,XXX]",
212
+ "[,XXXX]",
213
+ "[,XXXXX]",
214
+ "[,XXXXXX]",
215
+ "[,XXXXXXX]",
216
+ "[,XXXXXXXX]",
217
+ "[,XXXXXXXXX]"
218
+ ],
219
+ "clean_up_tokenization_spaces": true,
220
+ "cls_token": "[CLS]",
221
+ "do_basic_tokenize": true,
222
+ "do_lower_case": true,
223
+ "mask_token": "[MASK]",
224
+ "model_max_length": 512,
225
+ "never_split": null,
226
+ "pad_token": "[PAD]",
227
+ "sep_token": "[SEP]",
228
+ "strip_accents": null,
229
+ "tokenize_chinese_chars": true,
230
+ "tokenizer_class": "BertTokenizer",
231
+ "unk_token": "[UNK]"
232
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae95ec62ddeb350f24381f41e4cbbbab71871d091d9ecc78944d9715edf4738
3
+ size 3951
vocab.txt ADDED
The diff for this file is too large to render. See raw diff