hf-transformers-bot commited on
Commit
deb44e5
1 Parent(s): e6e1fbd

Upload tiny models for MPNetForMultipleChoice

Browse files
Files changed (7) hide show
  1. config.json +24 -0
  2. pytorch_model.bin +3 -0
  3. special_tokens_map.json +15 -0
  4. tf_model.h5 +3 -0
  5. tokenizer.json +1222 -0
  6. tokenizer_config.json +67 -0
  7. vocab.txt +1125 -0
config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "tiny_models/mpnet/MPNetForMultipleChoice",
3
+ "architectures": [
4
+ "MPNetForMultipleChoice"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 64,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 64,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "mpnet",
17
+ "num_attention_heads": 4,
18
+ "num_hidden_layers": 5,
19
+ "pad_token_id": 1,
20
+ "relative_attention_num_buckets": 32,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.28.0.dev0",
23
+ "vocab_size": 1125
24
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97dcbec84cbe87dbec0911f7212cbe6651897a45a870f0fab8ead890b3cfb94b
3
+ size 974015
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "[UNK]"
15
+ }
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88f0d03669f0f28c1cb821e37b265ccae041770441e159c7d8e9b473cf6e7bb5
3
+ size 1065792
tokenizer.json ADDED
@@ -0,0 +1,1222 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<s>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<pad>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "</s>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "<unk>",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": true,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 4,
44
+ "content": "[UNK]",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 5,
53
+ "content": "<mask>",
54
+ "single_word": false,
55
+ "lstrip": true,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ }
60
+ ],
61
+ "normalizer": {
62
+ "type": "BertNormalizer",
63
+ "clean_text": true,
64
+ "handle_chinese_chars": true,
65
+ "strip_accents": null,
66
+ "lowercase": true
67
+ },
68
+ "pre_tokenizer": {
69
+ "type": "BertPreTokenizer"
70
+ },
71
+ "post_processor": {
72
+ "type": "RobertaProcessing",
73
+ "sep": [
74
+ "</s>",
75
+ 2
76
+ ],
77
+ "cls": [
78
+ "<s>",
79
+ 0
80
+ ],
81
+ "trim_offsets": true,
82
+ "add_prefix_space": false
83
+ },
84
+ "decoder": {
85
+ "type": "WordPiece",
86
+ "prefix": "##",
87
+ "cleanup": true
88
+ },
89
+ "model": {
90
+ "type": "WordPiece",
91
+ "unk_token": "[UNK]",
92
+ "continuing_subword_prefix": "##",
93
+ "max_input_chars_per_word": 100,
94
+ "vocab": {
95
+ "<s>": 0,
96
+ "<pad>": 1,
97
+ "</s>": 2,
98
+ "<unk>": 3,
99
+ "[UNK]": 4,
100
+ "<mask>": 5,
101
+ "!": 6,
102
+ "\"": 7,
103
+ "#": 8,
104
+ "$": 9,
105
+ "%": 10,
106
+ "&": 11,
107
+ "'": 12,
108
+ "(": 13,
109
+ ")": 14,
110
+ "*": 15,
111
+ "+": 16,
112
+ ",": 17,
113
+ "-": 18,
114
+ ".": 19,
115
+ "/": 20,
116
+ "0": 21,
117
+ "1": 22,
118
+ "2": 23,
119
+ "3": 24,
120
+ "4": 25,
121
+ "5": 26,
122
+ "6": 27,
123
+ "7": 28,
124
+ "8": 29,
125
+ "9": 30,
126
+ ":": 31,
127
+ ";": 32,
128
+ "<": 33,
129
+ "=": 34,
130
+ ">": 35,
131
+ "?": 36,
132
+ "@": 37,
133
+ "[": 38,
134
+ "\\": 39,
135
+ "]": 40,
136
+ "^": 41,
137
+ "_": 42,
138
+ "`": 43,
139
+ "a": 44,
140
+ "b": 45,
141
+ "c": 46,
142
+ "d": 47,
143
+ "e": 48,
144
+ "f": 49,
145
+ "g": 50,
146
+ "h": 51,
147
+ "i": 52,
148
+ "j": 53,
149
+ "k": 54,
150
+ "l": 55,
151
+ "m": 56,
152
+ "n": 57,
153
+ "o": 58,
154
+ "p": 59,
155
+ "q": 60,
156
+ "r": 61,
157
+ "s": 62,
158
+ "t": 63,
159
+ "u": 64,
160
+ "v": 65,
161
+ "w": 66,
162
+ "x": 67,
163
+ "y": 68,
164
+ "z": 69,
165
+ "|": 70,
166
+ "}": 71,
167
+ "~": 72,
168
+ "¡": 73,
169
+ "¢": 74,
170
+ "£": 75,
171
+ "¥": 76,
172
+ "§": 77,
173
+ "°": 78,
174
+ "±": 79,
175
+ "²": 80,
176
+ "³": 81,
177
+ "´": 82,
178
+ "µ": 83,
179
+ "·": 84,
180
+ "º": 85,
181
+ "½": 86,
182
+ "¿": 87,
183
+ "×": 88,
184
+ "ß": 89,
185
+ "æ": 90,
186
+ "ð": 91,
187
+ "ø": 92,
188
+ "þ": 93,
189
+ "đ": 94,
190
+ "ħ": 95,
191
+ "ı": 96,
192
+ "ł": 97,
193
+ "œ": 98,
194
+ "ɐ": 99,
195
+ "ɑ": 100,
196
+ "ɒ": 101,
197
+ "ɔ": 102,
198
+ "ə": 103,
199
+ "ɛ": 104,
200
+ "ɜ": 105,
201
+ "ɡ": 106,
202
+ "ɢ": 107,
203
+ "ɪ": 108,
204
+ "ɫ": 109,
205
+ "ɳ": 110,
206
+ "ɽ": 111,
207
+ "ɾ": 112,
208
+ "ʁ": 113,
209
+ "ʃ": 114,
210
+ "ʊ": 115,
211
+ "ʋ": 116,
212
+ "ʒ": 117,
213
+ "ʔ": 118,
214
+ "ʕ": 119,
215
+ "ʲ": 120,
216
+ "ʻ": 121,
217
+ "ʼ": 122,
218
+ "ʾ": 123,
219
+ "ʿ": 124,
220
+ "ˈ": 125,
221
+ "ˌ": 126,
222
+ "ː": 127,
223
+ "α": 128,
224
+ "β": 129,
225
+ "γ": 130,
226
+ "δ": 131,
227
+ "ε": 132,
228
+ "η": 133,
229
+ "θ": 134,
230
+ "ι": 135,
231
+ "κ": 136,
232
+ "λ": 137,
233
+ "μ": 138,
234
+ "ν": 139,
235
+ "ξ": 140,
236
+ "ο": 141,
237
+ "π": 142,
238
+ "ρ": 143,
239
+ "ς": 144,
240
+ "σ": 145,
241
+ "τ": 146,
242
+ "υ": 147,
243
+ "φ": 148,
244
+ "χ": 149,
245
+ "ψ": 150,
246
+ "ω": 151,
247
+ "а": 152,
248
+ "б": 153,
249
+ "в": 154,
250
+ "г": 155,
251
+ "д": 156,
252
+ "е": 157,
253
+ "ж": 158,
254
+ "з": 159,
255
+ "и": 160,
256
+ "к": 161,
257
+ "л": 162,
258
+ "м": 163,
259
+ "н": 164,
260
+ "о": 165,
261
+ "п": 166,
262
+ "р": 167,
263
+ "с": 168,
264
+ "т": 169,
265
+ "у": 170,
266
+ "х": 171,
267
+ "ц": 172,
268
+ "ш": 173,
269
+ "ъ": 174,
270
+ "ы": 175,
271
+ "ь": 176,
272
+ "ю": 177,
273
+ "я": 178,
274
+ "є": 179,
275
+ "א": 180,
276
+ "ב": 181,
277
+ "ג": 182,
278
+ "ה": 183,
279
+ "ו": 184,
280
+ "ז": 185,
281
+ "ח": 186,
282
+ "י": 187,
283
+ "ל": 188,
284
+ "ם": 189,
285
+ "מ": 190,
286
+ "ן": 191,
287
+ "נ": 192,
288
+ "ס": 193,
289
+ "ף": 194,
290
+ "פ": 195,
291
+ "צ": 196,
292
+ "ר": 197,
293
+ "ש": 198,
294
+ "ת": 199,
295
+ "ء": 200,
296
+ "ا": 201,
297
+ "ب": 202,
298
+ "ة": 203,
299
+ "ت": 204,
300
+ "ث": 205,
301
+ "ج": 206,
302
+ "ح": 207,
303
+ "خ": 208,
304
+ "د": 209,
305
+ "ذ": 210,
306
+ "ر": 211,
307
+ "س": 212,
308
+ "ش": 213,
309
+ "ص": 214,
310
+ "ع": 215,
311
+ "ف": 216,
312
+ "ق": 217,
313
+ "ك": 218,
314
+ "ل": 219,
315
+ "م": 220,
316
+ "ن": 221,
317
+ "ه": 222,
318
+ "و": 223,
319
+ "ي": 224,
320
+ "ܐ": 225,
321
+ "ܕ": 226,
322
+ "ܗ": 227,
323
+ "ܝ": 228,
324
+ "ܠ": 229,
325
+ "ܢ": 230,
326
+ "ܬ": 231,
327
+ "अ": 232,
328
+ "ई": 233,
329
+ "क": 234,
330
+ "ग": 235,
331
+ "ण": 236,
332
+ "त": 237,
333
+ "द": 238,
334
+ "न": 239,
335
+ "प": 240,
336
+ "ब": 241,
337
+ "म": 242,
338
+ "य": 243,
339
+ "र": 244,
340
+ "ल": 245,
341
+ "व": 246,
342
+ "स": 247,
343
+ "ह": 248,
344
+ "ा": 249,
345
+ "ि": 250,
346
+ "আ": 251,
347
+ "ল": 252,
348
+ "হ": 253,
349
+ "া": 254,
350
+ "ਅ": 255,
351
+ "ਲ": 256,
352
+ "ਹ": 257,
353
+ "ਾ": 258,
354
+ "അ": 259,
355
+ "ള": 260,
356
+ "ഹ": 261,
357
+ "ാ": 262,
358
+ "ก": 263,
359
+ "ค": 264,
360
+ "ง": 265,
361
+ "ช": 266,
362
+ "ซ": 267,
363
+ "ญ": 268,
364
+ "ฐ": 269,
365
+ "ณ": 270,
366
+ "ด": 271,
367
+ "ต": 272,
368
+ "น": 273,
369
+ "บ": 274,
370
+ "ป": 275,
371
+ "พ": 276,
372
+ "ภ": 277,
373
+ "ม": 278,
374
+ "ย": 279,
375
+ "ร": 280,
376
+ "ล": 281,
377
+ "ว": 282,
378
+ "ศ": 283,
379
+ "ษ": 284,
380
+ "ส": 285,
381
+ "ห": 286,
382
+ "อ": 287,
383
+ "ฮ": 288,
384
+ "ะ": 289,
385
+ "า": 290,
386
+ "เ": 291,
387
+ "แ": 292,
388
+ "ไ": 293,
389
+ "ა": 294,
390
+ "ბ": 295,
391
+ "გ": 296,
392
+ "დ": 297,
393
+ "ე": 298,
394
+ "ვ": 299,
395
+ "ზ": 300,
396
+ "თ": 301,
397
+ "ი": 302,
398
+ "კ": 303,
399
+ "ლ": 304,
400
+ "მ": 305,
401
+ "ნ": 306,
402
+ "ო": 307,
403
+ "პ": 308,
404
+ "ჟ": 309,
405
+ "რ": 310,
406
+ "ს": 311,
407
+ "ტ": 312,
408
+ "უ": 313,
409
+ "ფ": 314,
410
+ "ქ": 315,
411
+ "ღ": 316,
412
+ "ყ": 317,
413
+ "შ": 318,
414
+ "ჩ": 319,
415
+ "ც": 320,
416
+ "ძ": 321,
417
+ "წ": 322,
418
+ "ჭ": 323,
419
+ "ხ": 324,
420
+ "ჯ": 325,
421
+ "ჰ": 326,
422
+ "ჱ": 327,
423
+ "ჲ": 328,
424
+ "ჳ": 329,
425
+ "ჴ": 330,
426
+ "ჵ": 331,
427
+ "ჶ": 332,
428
+ "ჷ": 333,
429
+ "ჸ": 334,
430
+ "ჹ": 335,
431
+ "ჺ": 336,
432
+ "჻": 337,
433
+ "ᄃ": 338,
434
+ "ᄅ": 339,
435
+ "ᄇ": 340,
436
+ "ᄋ": 341,
437
+ "ᄌ": 342,
438
+ "ᅡ": 343,
439
+ "ᅢ": 344,
440
+ "ᅦ": 345,
441
+ "ᅧ": 346,
442
+ "ᅩ": 347,
443
+ "ᅮ": 348,
444
+ "ᅵ": 349,
445
+ "ᆨ": 350,
446
+ "ᆫ": 351,
447
+ "ᆯ": 352,
448
+ "ᆸ": 353,
449
+ "ᆼ": 354,
450
+ "ᵻ": 355,
451
+ "‐": 356,
452
+ "‑": 357,
453
+ "–": 358,
454
+ "—": 359,
455
+ "―": 360,
456
+ "‘": 361,
457
+ "’": 362,
458
+ "“": 363,
459
+ "”": 364,
460
+ "„": 365,
461
+ "†": 366,
462
+ "‡": 367,
463
+ "•": 368,
464
+ "…": 369,
465
+ "′": 370,
466
+ "″": 371,
467
+ "⁄": 372,
468
+ "₣": 373,
469
+ "₤": 374,
470
+ "€": 375,
471
+ "₹": 376,
472
+ "⅓": 377,
473
+ "⅔": 378,
474
+ "→": 379,
475
+ "−": 380,
476
+ "≡": 381,
477
+ "≤": 382,
478
+ "①": 383,
479
+ "☉": 384,
480
+ "☫": 385,
481
+ "♀": 386,
482
+ "♭": 387,
483
+ "♯": 388,
484
+ "⚳": 389,
485
+ "ⴀ": 390,
486
+ "ⴂ": 391,
487
+ "ⴃ": 392,
488
+ "ⴈ": 393,
489
+ "ⴌ": 394,
490
+ "ⴕ": 395,
491
+ "ⴟ": 396,
492
+ "〈": 397,
493
+ "〉": 398,
494
+ "〜": 399,
495
+ "あ": 400,
496
+ "い": 401,
497
+ "う": 402,
498
+ "お": 403,
499
+ "か": 404,
500
+ "き": 405,
501
+ "く": 406,
502
+ "け": 407,
503
+ "こ": 408,
504
+ "さ": 409,
505
+ "し": 410,
506
+ "す": 411,
507
+ "せ": 412,
508
+ "た": 413,
509
+ "ち": 414,
510
+ "っ": 415,
511
+ "つ": 416,
512
+ "と": 417,
513
+ "な": 418,
514
+ "に": 419,
515
+ "の": 420,
516
+ "は": 421,
517
+ "ひ": 422,
518
+ "ふ": 423,
519
+ "ほ": 424,
520
+ "ま": 425,
521
+ "み": 426,
522
+ "め": 427,
523
+ "も": 428,
524
+ "ゃ": 429,
525
+ "ゆ": 430,
526
+ "ょ": 431,
527
+ "ら": 432,
528
+ "り": 433,
529
+ "る": 434,
530
+ "れ": 435,
531
+ "わ": 436,
532
+ "を": 437,
533
+ "ん": 438,
534
+ "ァ": 439,
535
+ "ア": 440,
536
+ "ィ": 441,
537
+ "イ": 442,
538
+ "ゥ": 443,
539
+ "ウ": 444,
540
+ "ェ": 445,
541
+ "エ": 446,
542
+ "ォ": 447,
543
+ "オ": 448,
544
+ "カ": 449,
545
+ "キ": 450,
546
+ "ク": 451,
547
+ "ケ": 452,
548
+ "コ": 453,
549
+ "サ": 454,
550
+ "シ": 455,
551
+ "ス": 456,
552
+ "セ": 457,
553
+ "タ": 458,
554
+ "チ": 459,
555
+ "ッ": 460,
556
+ "ツ": 461,
557
+ "テ": 462,
558
+ "ト": 463,
559
+ "ナ": 464,
560
+ "ニ": 465,
561
+ "ネ": 466,
562
+ "ノ": 467,
563
+ "ハ": 468,
564
+ "フ": 469,
565
+ "ヘ": 470,
566
+ "マ": 471,
567
+ "ミ": 472,
568
+ "ム": 473,
569
+ "モ": 474,
570
+ "ャ": 475,
571
+ "ュ": 476,
572
+ "ョ": 477,
573
+ "ラ": 478,
574
+ "リ": 479,
575
+ "ル": 480,
576
+ "レ": 481,
577
+ "ロ": 482,
578
+ "ン": 483,
579
+ "・": 484,
580
+ "ー": 485,
581
+ "一": 486,
582
+ "七": 487,
583
+ "下": 488,
584
+ "世": 489,
585
+ "丙": 490,
586
+ "中": 491,
587
+ "主": 492,
588
+ "乃": 493,
589
+ "之": 494,
590
+ "乙": 495,
591
+ "九": 496,
592
+ "二": 497,
593
+ "云": 498,
594
+ "人": 499,
595
+ "今": 500,
596
+ "付": 501,
597
+ "作": 502,
598
+ "侗": 503,
599
+ "依": 504,
600
+ "信": 505,
601
+ "傳": 506,
602
+ "儚": 507,
603
+ "充": 508,
604
+ "光": 509,
605
+ "全": 510,
606
+ "兵": 511,
607
+ "其": 512,
608
+ "具": 513,
609
+ "円": 514,
610
+ "再": 515,
611
+ "出": 516,
612
+ "判": 517,
613
+ "前": 518,
614
+ "剛": 519,
615
+ "劇": 520,
616
+ "劉": 521,
617
+ "動": 522,
618
+ "化": 523,
619
+ "北": 524,
620
+ "华": 525,
621
+ "厂": 526,
622
+ "去": 527,
623
+ "古": 528,
624
+ "可": 529,
625
+ "台": 530,
626
+ "史": 531,
627
+ "同": 532,
628
+ "名": 533,
629
+ "君": 534,
630
+ "吳": 535,
631
+ "周": 536,
632
+ "命": 537,
633
+ "和": 538,
634
+ "咲": 539,
635
+ "善": 540,
636
+ "四": 541,
637
+ "國": 542,
638
+ "園": 543,
639
+ "圣": 544,
640
+ "在": 545,
641
+ "坂": 546,
642
+ "堤": 547,
643
+ "場": 548,
644
+ "塘": 549,
645
+ "夕": 550,
646
+ "大": 551,
647
+ "天": 552,
648
+ "夫": 553,
649
+ "女": 554,
650
+ "妙": 555,
651
+ "姚": 556,
652
+ "子": 557,
653
+ "孟": 558,
654
+ "守": 559,
655
+ "安": 560,
656
+ "宋": 561,
657
+ "完": 562,
658
+ "宗": 563,
659
+ "宝": 564,
660
+ "宫": 565,
661
+ "寝": 566,
662
+ "寺": 567,
663
+ "小": 568,
664
+ "少": 569,
665
+ "尾": 570,
666
+ "山": 571,
667
+ "岳": 572,
668
+ "川": 573,
669
+ "州": 574,
670
+ "巳": 575,
671
+ "市": 576,
672
+ "師": 577,
673
+ "平": 578,
674
+ "广": 579,
675
+ "庆": 580,
676
+ "府": 581,
677
+ "座": 582,
678
+ "廬": 583,
679
+ "建": 584,
680
+ "式": 585,
681
+ "張": 586,
682
+ "彌": 587,
683
+ "彩": 588,
684
+ "彼": 589,
685
+ "後": 590,
686
+ "御": 591,
687
+ "德": 592,
688
+ "思": 593,
689
+ "愛": 594,
690
+ "憑": 595,
691
+ "憶": 596,
692
+ "應": 597,
693
+ "懷": 598,
694
+ "战": 599,
695
+ "戦": 600,
696
+ "扈": 601,
697
+ "技": 602,
698
+ "拉": 603,
699
+ "拳": 604,
700
+ "挑": 605,
701
+ "揺": 606,
702
+ "攻": 607,
703
+ "放": 608,
704
+ "政": 609,
705
+ "散": 610,
706
+ "斯": 611,
707
+ "方": 612,
708
+ "日": 613,
709
+ "旦": 614,
710
+ "旭": 615,
711
+ "昌": 616,
712
+ "明": 617,
713
+ "星": 618,
714
+ "春": 619,
715
+ "晋": 620,
716
+ "景": 621,
717
+ "曦": 622,
718
+ "月": 623,
719
+ "望": 624,
720
+ "未": 625,
721
+ "本": 626,
722
+ "李": 627,
723
+ "村": 628,
724
+ "杜": 629,
725
+ "束": 630,
726
+ "来": 631,
727
+ "林": 632,
728
+ "桜": 633,
729
+ "梶": 634,
730
+ "棘": 635,
731
+ "椎": 636,
732
+ "楊": 637,
733
+ "楚": 638,
734
+ "榮": 639,
735
+ "橘": 640,
736
+ "機": 641,
737
+ "正": 642,
738
+ "殻": 643,
739
+ "殿": 644,
740
+ "母": 645,
741
+ "水": 646,
742
+ "汉": 647,
743
+ "沂": 648,
744
+ "沙": 649,
745
+ "河": 650,
746
+ "泗": 651,
747
+ "波": 652,
748
+ "泣": 653,
749
+ "洪": 654,
750
+ "淹": 655,
751
+ "清": 656,
752
+ "湯": 657,
753
+ "漢": 658,
754
+ "澄": 659,
755
+ "澤": 660,
756
+ "火": 661,
757
+ "灯": 662,
758
+ "灵": 663,
759
+ "灼": 664,
760
+ "焼": 665,
761
+ "熱": 666,
762
+ "物": 667,
763
+ "狐": 668,
764
+ "狸": 669,
765
+ "玄": 670,
766
+ "王": 671,
767
+ "玩": 672,
768
+ "珂": 673,
769
+ "珙": 674,
770
+ "球": 675,
771
+ "理": 676,
772
+ "琦": 677,
773
+ "琪": 678,
774
+ "瓊": 679,
775
+ "生": 680,
776
+ "田": 681,
777
+ "畢": 682,
778
+ "番": 683,
779
+ "瘡": 684,
780
+ "白": 685,
781
+ "皮": 686,
782
+ "真": 687,
783
+ "砲": 688,
784
+ "礮": 689,
785
+ "祈": 690,
786
+ "神": 691,
787
+ "祠": 692,
788
+ "秋": 693,
789
+ "空": 694,
790
+ "立": 695,
791
+ "精": 696,
792
+ "約": 697,
793
+ "絵": 698,
794
+ "織": 699,
795
+ "義": 700,
796
+ "翠": 701,
797
+ "者": 702,
798
+ "耕": 703,
799
+ "肖": 704,
800
+ "胡": 705,
801
+ "膀": 706,
802
+ "臂": 707,
803
+ "興": 708,
804
+ "良": 709,
805
+ "花": 710,
806
+ "芳": 711,
807
+ "芽": 712,
808
+ "若": 713,
809
+ "英": 714,
810
+ "藕": 715,
811
+ "藥": 716,
812
+ "蘄": 717,
813
+ "蘇": 718,
814
+ "行": 719,
815
+ "裁": 720,
816
+ "規": 721,
817
+ "覺": 722,
818
+ "观": 723,
819
+ "解": 724,
820
+ "記": 725,
821
+ "誓": 726,
822
+ "誡": 727,
823
+ "誰": 728,
824
+ "謎": 729,
825
+ "许": 730,
826
+ "谭": 731,
827
+ "豪": 732,
828
+ "豫": 733,
829
+ "費": 734,
830
+ "贵": 735,
831
+ "赤": 736,
832
+ "趙": 737,
833
+ "足": 738,
834
+ "跡": 739,
835
+ "転": 740,
836
+ "辛": 741,
837
+ "逆": 742,
838
+ "遇": 743,
839
+ "運": 744,
840
+ "過": 745,
841
+ "遠": 746,
842
+ "選": 747,
843
+ "邦": 748,
844
+ "邱": 749,
845
+ "部": 750,
846
+ "郭": 751,
847
+ "都": 752,
848
+ "酈": 753,
849
+ "里": 754,
850
+ "野": 755,
851
+ "金": 756,
852
+ "銃": 757,
853
+ "鋼": 758,
854
+ "錄": 759,
855
+ "錡": 760,
856
+ "鍵": 761,
857
+ "鐵": 762,
858
+ "钱": 763,
859
+ "铁": 764,
860
+ "關": 765,
861
+ "防": 766,
862
+ "阿": 767,
863
+ "陈": 768,
864
+ "陳": 769,
865
+ "陽": 770,
866
+ "隊": 771,
867
+ "階": 772,
868
+ "集": 773,
869
+ "雪": 774,
870
+ "雲": 775,
871
+ "霖": 776,
872
+ "霹": 777,
873
+ "靂": 778,
874
+ "韓": 779,
875
+ "願": 780,
876
+ "顯": 781,
877
+ "颜": 782,
878
+ "马": 783,
879
+ "高": 784,
880
+ "龍": 785,
881
+ "ﷲ": 786,
882
+ "ﻋ": 787,
883
+ "/": 788,
884
+ "3": 789,
885
+ "~": 790,
886
+ "##s": 791,
887
+ "##p": 792,
888
+ "##e": 793,
889
+ "##n": 794,
890
+ "##a": 795,
891
+ "##t": 796,
892
+ "##h": 797,
893
+ "##r": 798,
894
+ "##i": 799,
895
+ "##g": 800,
896
+ "##4": 801,
897
+ "##9": 802,
898
+ "##v": 803,
899
+ "##u": 804,
900
+ "##l": 805,
901
+ "##c": 806,
902
+ "##y": 807,
903
+ "##m": 808,
904
+ "##o": 809,
905
+ "##d": 810,
906
+ "##q": 811,
907
+ "##f": 812,
908
+ "##b": 813,
909
+ "##j": 814,
910
+ "##k": 815,
911
+ "##w": 816,
912
+ "##z": 817,
913
+ "##6": 818,
914
+ "##0": 819,
915
+ "##1": 820,
916
+ "##x": 821,
917
+ "##8": 822,
918
+ "##7": 823,
919
+ "##3": 824,
920
+ "##2": 825,
921
+ "##а": 826,
922
+ "##л": 827,
923
+ "##ы": 828,
924
+ "##и": 829,
925
+ "##ル": 830,
926
+ "##ハ": 831,
927
+ "##ト": 832,
928
+ "##ス": 833,
929
+ "##5": 834,
930
+ "##р": 835,
931
+ "##с": 836,
932
+ "##н": 837,
933
+ "##ɪ": 838,
934
+ "##ʃ": 839,
935
+ "##ɑ": 840,
936
+ "##ː": 841,
937
+ "##ი": 842,
938
+ "##ウ": 843,
939
+ "##ァ": 844,
940
+ "##キ": 845,
941
+ "##ュ": 846,
942
+ "##リ": 847,
943
+ "##ア": 848,
944
+ "##う": 849,
945
+ "##き": 850,
946
+ "##ł": 851,
947
+ "##ッ": 852,
948
+ "##ク": 853,
949
+ "##マ": 854,
950
+ "##ン": 855,
951
+ "##テ": 856,
952
+ "##ィ": 857,
953
+ "##ニ": 858,
954
+ "##ー": 859,
955
+ "##ل": 860,
956
+ "##ا": 861,
957
+ "##ب": 862,
958
+ "##ن": 863,
959
+ "##ล": 864,
960
+ "##ย": 865,
961
+ "##า": 866,
962
+ "##ณ": 867,
963
+ "##ม": 868,
964
+ "##ต": 869,
965
+ "##ร": 870,
966
+ "##τ": 871,
967
+ "##ι": 872,
968
+ "##β": 873,
969
+ "##เ": 874,
970
+ "##ป": 875,
971
+ "##რ": 876,
972
+ "##გ": 877,
973
+ "##ვ": 878,
974
+ "##ლ": 879,
975
+ "##ო": 880,
976
+ "##ა": 881,
977
+ "##ნ": 882,
978
+ "##ラ": 883,
979
+ "##ъ": 884,
980
+ "##к": 885,
981
+ "##в": 886,
982
+ "##đ": 887,
983
+ "##ø": 888,
984
+ "##ɾ": 889,
985
+ "##ʲ": 890,
986
+ "##ə": 891,
987
+ "##ˈ": 892,
988
+ "##ב": 893,
989
+ "##ת": 894,
990
+ "##א": 895,
991
+ "##י": 896,
992
+ "##ك": 897,
993
+ "##ر": 898,
994
+ "##د": 899,
995
+ "##っ": 900,
996
+ "##е": 901,
997
+ "##о": 902,
998
+ "##у": 903,
999
+ "##я": 904,
1000
+ "##ɔ": 905,
1001
+ "##ʔ": 906,
1002
+ "##ذ": 907,
1003
+ "##ي": 908,
1004
+ "##ة": 909,
1005
+ "##ს": 910,
1006
+ "##ტ": 911,
1007
+ "##ე": 912,
1008
+ "##サ": 913,
1009
+ "##た": 914,
1010
+ "##し": 915,
1011
+ "##の": 916,
1012
+ "##す": 917,
1013
+ "##な": 918,
1014
+ "##ひ": 919,
1015
+ "##と": 920,
1016
+ "##ן": 921,
1017
+ "##レ": 922,
1018
+ "##チ": 923,
1019
+ "##ナ": 924,
1020
+ "##უ": 925,
1021
+ "##ც": 926,
1022
+ "##ف": 927,
1023
+ "##س": 928,
1024
+ "##ɐ": 929,
1025
+ "##ᅦ": 930,
1026
+ "##ᄃ": 931,
1027
+ "##ᅩ": 932,
1028
+ "##ᆨ": 933,
1029
+ "##ᄅ": 934,
1030
+ "##ᅵ": 935,
1031
+ "##ᆸ": 936,
1032
+ "##ᄇ": 937,
1033
+ "##ᅧ": 938,
1034
+ "##ᆼ": 939,
1035
+ "##ᄋ": 940,
1036
+ "##ᆫ": 941,
1037
+ "##ᅢ": 942,
1038
+ "##ε": 943,
1039
+ "##ρ": 944,
1040
+ "##α": 945,
1041
+ "##ς": 946,
1042
+ "##ش": 947,
1043
+ "##م": 948,
1044
+ "##و": 949,
1045
+ "##フ": 950,
1046
+ "##ロ": 951,
1047
+ "##ð": 952,
1048
+ "##ხ": 953,
1049
+ "##3": 954,
1050
+ "##æ": 955,
1051
+ "##ল": 956,
1052
+ "##ɡ": 957,
1053
+ "##ع": 958,
1054
+ "##π": 959,
1055
+ "##κ": 960,
1056
+ "##ο": 961,
1057
+ "##ق": 962,
1058
+ "##ت": 963,
1059
+ "##ɒ": 964,
1060
+ "##χ": 965,
1061
+ "##λ": 966,
1062
+ "##ภ": 967,
1063
+ "##ด": 968,
1064
+ "##п": 969,
1065
+ "##г": 970,
1066
+ "##れ": 971,
1067
+ "##る": 972,
1068
+ "##פ": 973,
1069
+ "##ה": 974,
1070
+ "##ा": 975,
1071
+ "##न": 976,
1072
+ "##ਲ": 977,
1073
+ "##ਹ": 978,
1074
+ "##ɛ": 979,
1075
+ "##ʊ": 980,
1076
+ "##ᅮ": 981,
1077
+ "##は": 982,
1078
+ "##り": 983,
1079
+ "##く": 984,
1080
+ "##あ": 985,
1081
+ "##ν": 986,
1082
+ "##μ": 987,
1083
+ "##อ": 988,
1084
+ "##ก": 989,
1085
+ "##ว": 990,
1086
+ "##ܕ": 991,
1087
+ "##ܝ": 992,
1088
+ "##ܢ": 993,
1089
+ "##ܬ": 994,
1090
+ "##ォ": 995,
1091
+ "##ه": 996,
1092
+ "##з": 997,
1093
+ "##シ": 998,
1094
+ "##მ": 999,
1095
+ "##წ": 1000,
1096
+ "##ფ": 1001,
1097
+ "##つ": 1002,
1098
+ "##か": 1003,
1099
+ "##ค": 1004,
1100
+ "##ण": 1005,
1101
+ "##ई": 1006,
1102
+ "##ξ": 1007,
1103
+ "##も": 1008,
1104
+ "##み": 1009,
1105
+ "##д": 1010,
1106
+ "##ж": 1011,
1107
+ "##т": 1012,
1108
+ "##व": 1013,
1109
+ "##द": 1014,
1110
+ "##ह": 1015,
1111
+ "##ि": 1016,
1112
+ "##क": 1017,
1113
+ "##ω": 1018,
1114
+ "##お": 1019,
1115
+ "##ʻ": 1020,
1116
+ "##ซ": 1021,
1117
+ "##せ": 1022,
1118
+ "##ん": 1023,
1119
+ "##œ": 1024,
1120
+ "##こ": 1025,
1121
+ "##ら": 1026,
1122
+ "##া": 1027,
1123
+ "##হ": 1028,
1124
+ "##η": 1029,
1125
+ "##ß": 1030,
1126
+ "##ჱ": 1031,
1127
+ "##ı": 1032,
1128
+ "##ث": 1033,
1129
+ "##ᵻ": 1034,
1130
+ "##υ": 1035,
1131
+ "##θ": 1036,
1132
+ "##ɽ": 1037,
1133
+ "##ょ": 1038,
1134
+ "##に": 1039,
1135
+ "##γ": 1040,
1136
+ "##を": 1041,
1137
+ "##พ": 1042,
1138
+ "##わ": 1043,
1139
+ "##い": 1044,
1140
+ "##ш": 1045,
1141
+ "##თ": 1046,
1142
+ "##め": 1047,
1143
+ "##カ": 1048,
1144
+ "##ʿ": 1049,
1145
+ "##ר": 1050,
1146
+ "##ם": 1051,
1147
+ "##ჲ": 1052,
1148
+ "##ネ": 1053,
1149
+ "##ョ": 1054,
1150
+ "##ψ": 1055,
1151
+ "##ち": 1056,
1152
+ "##ゃ": 1057,
1153
+ "##σ": 1058,
1154
+ "##დ": 1059,
1155
+ "##र": 1060,
1156
+ "##タ": 1061,
1157
+ "##ム": 1062,
1158
+ "##ェ": 1063,
1159
+ "##ء": 1064,
1160
+ "##ל": 1065,
1161
+ "##ɫ": 1066,
1162
+ "##х": 1067,
1163
+ "##ᅡ": 1068,
1164
+ "##ᆯ": 1069,
1165
+ "##ゥ": 1070,
1166
+ "##イ": 1071,
1167
+ "##ฮ": 1072,
1168
+ "##ง": 1073,
1169
+ "##ไ": 1074,
1170
+ "##ช": 1075,
1171
+ "##แ": 1076,
1172
+ "##ग": 1077,
1173
+ "##خ": 1078,
1174
+ "##ま": 1079,
1175
+ "##ノ": 1080,
1176
+ "##ס": 1081,
1177
+ "##ャ": 1082,
1178
+ "##モ": 1083,
1179
+ "##ल": 1084,
1180
+ "##ו": 1085,
1181
+ "##ح": 1086,
1182
+ "##ц": 1087,
1183
+ "##ь": 1088,
1184
+ "##ף": 1089,
1185
+ "##ള": 1090,
1186
+ "##δ": 1091,
1187
+ "##ਾ": 1092,
1188
+ "##м": 1093,
1189
+ "##ษ": 1094,
1190
+ "##ฐ": 1095,
1191
+ "##ാ": 1096,
1192
+ "##ഹ": 1097,
1193
+ "##ツ": 1098,
1194
+ "##セ": 1099,
1195
+ "##オ": 1100,
1196
+ "##ʒ": 1101,
1197
+ "##ქ": 1102,
1198
+ "##ю": 1103,
1199
+ "##ʁ": 1104,
1200
+ "##ˌ": 1105,
1201
+ "##स": 1106,
1202
+ "##ص": 1107,
1203
+ "##º": 1108,
1204
+ "##エ": 1109,
1205
+ "##ミ": 1110,
1206
+ "##ש": 1111,
1207
+ "##מ": 1112,
1208
+ "##צ": 1113,
1209
+ "##ɜ": 1114,
1210
+ "##ܠ": 1115,
1211
+ "##ܗ": 1116,
1212
+ "##ܐ": 1117,
1213
+ "##ะ": 1118,
1214
+ "##น": 1119,
1215
+ "##є": 1120,
1216
+ "##ゆ": 1121,
1217
+ "##ɳ": 1122,
1218
+ "##נ": 1123,
1219
+ "##ჳ": 1124
1220
+ }
1221
+ }
1222
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "__type": "AddedToken",
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": true,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ "clean_up_tokenization_spaces": true,
11
+ "cls_token": {
12
+ "__type": "AddedToken",
13
+ "content": "<s>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "do_basic_tokenize": true,
20
+ "do_lower_case": true,
21
+ "eos_token": {
22
+ "__type": "AddedToken",
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": true,
26
+ "rstrip": false,
27
+ "single_word": false
28
+ },
29
+ "mask_token": {
30
+ "__type": "AddedToken",
31
+ "content": "<mask>",
32
+ "lstrip": true,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "model_max_length": 512,
38
+ "never_split": null,
39
+ "pad_token": {
40
+ "__type": "AddedToken",
41
+ "content": "<pad>",
42
+ "lstrip": false,
43
+ "normalized": true,
44
+ "rstrip": false,
45
+ "single_word": false
46
+ },
47
+ "sep_token": {
48
+ "__type": "AddedToken",
49
+ "content": "</s>",
50
+ "lstrip": false,
51
+ "normalized": true,
52
+ "rstrip": false,
53
+ "single_word": false
54
+ },
55
+ "special_tokens_map_file": null,
56
+ "strip_accents": null,
57
+ "tokenize_chinese_chars": true,
58
+ "tokenizer_class": "MPNetTokenizer",
59
+ "unk_token": {
60
+ "__type": "AddedToken",
61
+ "content": "[UNK]",
62
+ "lstrip": false,
63
+ "normalized": true,
64
+ "rstrip": false,
65
+ "single_word": false
66
+ }
67
+ }
vocab.txt ADDED
@@ -0,0 +1,1125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <s>
2
+ <pad>
3
+ </s>
4
+ <unk>
5
+ [UNK]
6
+ <mask>
7
+ !
8
+ "
9
+ #
10
+ $
11
+ %
12
+ &
13
+ '
14
+ (
15
+ )
16
+ *
17
+ +
18
+ ,
19
+ -
20
+ .
21
+ /
22
+ 0
23
+ 1
24
+ 2
25
+ 3
26
+ 4
27
+ 5
28
+ 6
29
+ 7
30
+ 8
31
+ 9
32
+ :
33
+ ;
34
+ <
35
+ =
36
+ >
37
+ ?
38
+ @
39
+ [
40
+ \
41
+ ]
42
+ ^
43
+ _
44
+ `
45
+ a
46
+ b
47
+ c
48
+ d
49
+ e
50
+ f
51
+ g
52
+ h
53
+ i
54
+ j
55
+ k
56
+ l
57
+ m
58
+ n
59
+ o
60
+ p
61
+ q
62
+ r
63
+ s
64
+ t
65
+ u
66
+ v
67
+ w
68
+ x
69
+ y
70
+ z
71
+ |
72
+ }
73
+ ~
74
+ ¡
75
+ ¢
76
+ £
77
+ ¥
78
+ §
79
+ °
80
+ ±
81
+ ²
82
+ ³
83
+ ´
84
+ µ
85
+ ·
86
+ º
87
+ ½
88
+ ¿
89
+ ×
90
+ ß
91
+ æ
92
+ ð
93
+ ø
94
+ þ
95
+ đ
96
+ ħ
97
+ ı
98
+ ł
99
+ œ
100
+ ɐ
101
+ ɑ
102
+ ɒ
103
+ ɔ
104
+ ə
105
+ ɛ
106
+ ɜ
107
+ ɡ
108
+ ɢ
109
+ ɪ
110
+ ɫ
111
+ ɳ
112
+ ɽ
113
+ ɾ
114
+ ʁ
115
+ ʃ
116
+ ʊ
117
+ ʋ
118
+ ʒ
119
+ ʔ
120
+ ʕ
121
+ ʲ
122
+ ʻ
123
+ ʼ
124
+ ʾ
125
+ ʿ
126
+ ˈ
127
+ ˌ
128
+ ː
129
+ α
130
+ β
131
+ γ
132
+ δ
133
+ ε
134
+ η
135
+ θ
136
+ ι
137
+ κ
138
+ λ
139
+ μ
140
+ ν
141
+ ξ
142
+ ο
143
+ π
144
+ ρ
145
+ ς
146
+ σ
147
+ τ
148
+ υ
149
+ φ
150
+ χ
151
+ ψ
152
+ ω
153
+ а
154
+ б
155
+ в
156
+ г
157
+ д
158
+ е
159
+ ж
160
+ з
161
+ и
162
+ к
163
+ л
164
+ м
165
+ н
166
+ о
167
+ п
168
+ р
169
+ с
170
+ т
171
+ у
172
+ х
173
+ ц
174
+ ш
175
+ ъ
176
+ ы
177
+ ь
178
+ ю
179
+ я
180
+ є
181
+ א
182
+ ב
183
+ ג
184
+ ה
185
+ ו
186
+ ז
187
+ ח
188
+ י
189
+ ל
190
+ ם
191
+ מ
192
+ ן
193
+ נ
194
+ ס
195
+ ף
196
+ פ
197
+ צ
198
+ ר
199
+ ש
200
+ ת
201
+ ء
202
+ ا
203
+ ب
204
+ ة
205
+ ت
206
+ ث
207
+ ج
208
+ ح
209
+ خ
210
+ د
211
+ ذ
212
+ ر
213
+ س
214
+ ش
215
+ ص
216
+ ع
217
+ ف
218
+ ق
219
+ ك
220
+ ل
221
+ م
222
+ ن
223
+ ه
224
+ و
225
+ ي
226
+ ܐ
227
+ ܕ
228
+ ܗ
229
+ ܝ
230
+ ܠ
231
+ ܢ
232
+ ܬ
233
+
234
+
235
+
236
+
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+
248
+
249
+
250
+
251
+ ि
252
+
253
+
254
+
255
+
256
+
257
+
258
+
259
+
260
+
261
+
262
+
263
+
264
+
265
+
266
+
267
+
268
+
269
+
270
+
271
+
272
+
273
+
274
+
275
+
276
+
277
+
278
+
279
+
280
+
281
+
282
+
283
+
284
+
285
+
286
+
287
+
288
+
289
+
290
+
291
+
292
+
293
+
294
+
295
+
296
+
297
+
298
+
299
+
300
+
301
+
302
+
303
+
304
+
305
+
306
+
307
+
308
+
309
+
310
+
311
+
312
+
313
+
314
+
315
+
316
+
317
+
318
+
319
+
320
+
321
+
322
+
323
+
324
+
325
+
326
+
327
+
328
+
329
+
330
+
331
+
332
+
333
+
334
+
335
+
336
+
337
+
338
+
339
+
340
+
341
+
342
+
343
+
344
+
345
+
346
+
347
+
348
+
349
+
350
+
351
+
352
+
353
+
354
+
355
+
356
+
357
+
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+
391
+
392
+
393
+
394
+
395
+
396
+
397
+
398
+
399
+
400
+
401
+
402
+
403
+
404
+
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+
413
+
414
+
415
+
416
+
417
+
418
+
419
+
420
+
421
+
422
+
423
+
424
+
425
+
426
+
427
+
428
+
429
+
430
+
431
+
432
+
433
+
434
+
435
+
436
+
437
+
438
+
439
+
440
+
441
+
442
+
443
+
444
+
445
+
446
+
447
+
448
+
449
+
450
+
451
+
452
+
453
+
454
+
455
+
456
+
457
+
458
+
459
+
460
+
461
+
462
+
463
+
464
+
465
+
466
+
467
+
468
+
469
+
470
+
471
+
472
+
473
+
474
+
475
+
476
+
477
+
478
+
479
+
480
+
481
+
482
+
483
+
484
+
485
+
486
+
487
+
488
+
489
+
490
+
491
+
492
+
493
+
494
+
495
+
496
+
497
+
498
+
499
+
500
+
501
+
502
+
503
+
504
+
505
+
506
+
507
+
508
+
509
+
510
+
511
+
512
+
513
+
514
+
515
+
516
+
517
+
518
+
519
+
520
+
521
+
522
+
523
+
524
+
525
+
526
+
527
+
528
+
529
+
530
+
531
+
532
+
533
+
534
+
535
+
536
+
537
+
538
+
539
+
540
+
541
+
542
+
543
+
544
+
545
+
546
+
547
+
548
+
549
+
550
+
551
+
552
+
553
+
554
+
555
+
556
+
557
+
558
+
559
+
560
+
561
+
562
+
563
+
564
+
565
+
566
+
567
+
568
+
569
+
570
+
571
+
572
+
573
+
574
+
575
+
576
+
577
+
578
+
579
+
580
+ 广
581
+
582
+
583
+
584
+
585
+
586
+
587
+
588
+
589
+
590
+
591
+
592
+
593
+
594
+
595
+
596
+
597
+
598
+
599
+
600
+
601
+
602
+
603
+
604
+
605
+
606
+
607
+
608
+
609
+
610
+
611
+
612
+
613
+
614
+
615
+
616
+
617
+
618
+
619
+
620
+
621
+
622
+
623
+
624
+
625
+
626
+
627
+
628
+
629
+
630
+
631
+
632
+
633
+
634
+
635
+
636
+
637
+
638
+
639
+
640
+
641
+
642
+
643
+
644
+
645
+ 殿
646
+
647
+
648
+
649
+
650
+
651
+
652
+
653
+
654
+
655
+
656
+
657
+
658
+
659
+
660
+
661
+
662
+
663
+
664
+
665
+
666
+
667
+
668
+
669
+
670
+
671
+
672
+
673
+
674
+
675
+
676
+
677
+
678
+
679
+
680
+
681
+
682
+
683
+
684
+
685
+
686
+
687
+
688
+
689
+
690
+
691
+
692
+
693
+
694
+
695
+
696
+
697
+
698
+
699
+
700
+
701
+
702
+
703
+
704
+
705
+
706
+
707
+
708
+
709
+
710
+
711
+
712
+
713
+
714
+
715
+
716
+
717
+
718
+
719
+
720
+
721
+
722
+
723
+
724
+
725
+
726
+
727
+
728
+
729
+
730
+
731
+
732
+
733
+
734
+
735
+
736
+
737
+
738
+
739
+
740
+
741
+
742
+
743
+
744
+
745
+
746
+
747
+
748
+
749
+
750
+
751
+
752
+
753
+
754
+
755
+
756
+
757
+
758
+
759
+
760
+
761
+
762
+
763
+
764
+
765
+
766
+
767
+
768
+
769
+
770
+
771
+
772
+
773
+
774
+
775
+
776
+
777
+
778
+
779
+
780
+
781
+
782
+
783
+
784
+
785
+
786
+
787
+
788
+
789
+
790
+
791
+
792
+ ##s
793
+ ##p
794
+ ##e
795
+ ##n
796
+ ##a
797
+ ##t
798
+ ##h
799
+ ##r
800
+ ##i
801
+ ##g
802
+ ##4
803
+ ##9
804
+ ##v
805
+ ##u
806
+ ##l
807
+ ##c
808
+ ##y
809
+ ##m
810
+ ##o
811
+ ##d
812
+ ##q
813
+ ##f
814
+ ##b
815
+ ##j
816
+ ##k
817
+ ##w
818
+ ##z
819
+ ##6
820
+ ##0
821
+ ##1
822
+ ##x
823
+ ##8
824
+ ##7
825
+ ##3
826
+ ##2
827
+ ##а
828
+ ##л
829
+ ##ы
830
+ ##и
831
+ ##ル
832
+ ##ハ
833
+ ##ト
834
+ ##ス
835
+ ##5
836
+ ##р
837
+ ##с
838
+ ##н
839
+ ##ɪ
840
+ ##ʃ
841
+ ##ɑ
842
+ ##ː
843
+ ##ი
844
+ ##ウ
845
+ ##ァ
846
+ ##キ
847
+ ##ュ
848
+ ##リ
849
+ ##ア
850
+ ##う
851
+ ##き
852
+ ##ł
853
+ ##ッ
854
+ ##ク
855
+ ##マ
856
+ ##ン
857
+ ##テ
858
+ ##ィ
859
+ ##ニ
860
+ ##ー
861
+ ##ل
862
+ ##ا
863
+ ##ب
864
+ ##ن
865
+ ##ล
866
+ ##ย
867
+ ##า
868
+ ##ณ
869
+ ##ม
870
+ ##ต
871
+ ##ร
872
+ ##τ
873
+ ##ι
874
+ ##β
875
+ ##เ
876
+ ##ป
877
+ ##რ
878
+ ##გ
879
+ ##ვ
880
+ ##ლ
881
+ ##ო
882
+ ##ა
883
+ ##ნ
884
+ ##ラ
885
+ ##ъ
886
+ ##к
887
+ ##в
888
+ ##đ
889
+ ##ø
890
+ ##ɾ
891
+ ##ʲ
892
+ ##ə
893
+ ##ˈ
894
+ ##ב
895
+ ##ת
896
+ ##א
897
+ ##י
898
+ ##ك
899
+ ##ر
900
+ ##د
901
+ ##っ
902
+ ##е
903
+ ##о
904
+ ##у
905
+ ##я
906
+ ##ɔ
907
+ ##ʔ
908
+ ##ذ
909
+ ##ي
910
+ ##ة
911
+ ##ს
912
+ ##ტ
913
+ ##ე
914
+ ##サ
915
+ ##た
916
+ ##し
917
+ ##の
918
+ ##す
919
+ ##な
920
+ ##ひ
921
+ ##と
922
+ ##ן
923
+ ##レ
924
+ ##チ
925
+ ##ナ
926
+ ##უ
927
+ ##ც
928
+ ##ف
929
+ ##س
930
+ ##ɐ
931
+ ##ᅦ
932
+ ##ᄃ
933
+ ##ᅩ
934
+ ##ᆨ
935
+ ##ᄅ
936
+ ##ᅵ
937
+ ##ᆸ
938
+ ##ᄇ
939
+ ##ᅧ
940
+ ##ᆼ
941
+ ##ᄋ
942
+ ##ᆫ
943
+ ##ᅢ
944
+ ##ε
945
+ ##ρ
946
+ ##α
947
+ ##ς
948
+ ##ش
949
+ ##م
950
+ ##و
951
+ ##フ
952
+ ##ロ
953
+ ##ð
954
+ ##ხ
955
+ ##3
956
+ ##æ
957
+ ##ল
958
+ ##ɡ
959
+ ##ع
960
+ ##π
961
+ ##κ
962
+ ##ο
963
+ ##ق
964
+ ##ت
965
+ ##ɒ
966
+ ##χ
967
+ ##λ
968
+ ##ภ
969
+ ##ด
970
+ ##п
971
+ ##г
972
+ ##れ
973
+ ##る
974
+ ##פ
975
+ ##ה
976
+ ##ा
977
+ ##न
978
+ ##ਲ
979
+ ##ਹ
980
+ ##ɛ
981
+ ##ʊ
982
+ ##ᅮ
983
+ ##は
984
+ ##り
985
+ ##く
986
+ ##あ
987
+ ##ν
988
+ ##μ
989
+ ##อ
990
+ ##ก
991
+ ##ว
992
+ ##ܕ
993
+ ##ܝ
994
+ ##ܢ
995
+ ##ܬ
996
+ ##ォ
997
+ ##ه
998
+ ##з
999
+ ##シ
1000
+ ##მ
1001
+ ##წ
1002
+ ##ფ
1003
+ ##つ
1004
+ ##か
1005
+ ##ค
1006
+ ##ण
1007
+ ##ई
1008
+ ##ξ
1009
+ ##も
1010
+ ##み
1011
+ ##д
1012
+ ##ж
1013
+ ##т
1014
+ ##व
1015
+ ##द
1016
+ ##ह
1017
+ ##ि
1018
+ ##���
1019
+ ##ω
1020
+ ##お
1021
+ ##ʻ
1022
+ ##ซ
1023
+ ##せ
1024
+ ##ん
1025
+ ##œ
1026
+ ##こ
1027
+ ##ら
1028
+ ##া
1029
+ ##হ
1030
+ ##η
1031
+ ##ß
1032
+ ##ჱ
1033
+ ##ı
1034
+ ##ث
1035
+ ##ᵻ
1036
+ ##υ
1037
+ ##θ
1038
+ ##ɽ
1039
+ ##ょ
1040
+ ##に
1041
+ ##γ
1042
+ ##を
1043
+ ##พ
1044
+ ##わ
1045
+ ##い
1046
+ ##ш
1047
+ ##თ
1048
+ ##め
1049
+ ##カ
1050
+ ##ʿ
1051
+ ##ר
1052
+ ##ם
1053
+ ##ჲ
1054
+ ##ネ
1055
+ ##ョ
1056
+ ##ψ
1057
+ ##ち
1058
+ ##ゃ
1059
+ ##σ
1060
+ ##დ
1061
+ ##र
1062
+ ##タ
1063
+ ##ム
1064
+ ##ェ
1065
+ ##ء
1066
+ ##ל
1067
+ ##ɫ
1068
+ ##х
1069
+ ##ᅡ
1070
+ ##ᆯ
1071
+ ##ゥ
1072
+ ##イ
1073
+ ##ฮ
1074
+ ##ง
1075
+ ##ไ
1076
+ ##ช
1077
+ ##แ
1078
+ ##ग
1079
+ ##خ
1080
+ ##ま
1081
+ ##ノ
1082
+ ##ס
1083
+ ##ャ
1084
+ ##モ
1085
+ ##ल
1086
+ ##ו
1087
+ ##ح
1088
+ ##ц
1089
+ ##ь
1090
+ ##ף
1091
+ ##ള
1092
+ ##δ
1093
+ ##ਾ
1094
+ ##м
1095
+ ##ษ
1096
+ ##ฐ
1097
+ ##ാ
1098
+ ##ഹ
1099
+ ##ツ
1100
+ ##セ
1101
+ ##オ
1102
+ ##ʒ
1103
+ ##ქ
1104
+ ##ю
1105
+ ##ʁ
1106
+ ##ˌ
1107
+ ##स
1108
+ ##ص
1109
+ ##º
1110
+ ##エ
1111
+ ##ミ
1112
+ ##ש
1113
+ ##מ
1114
+ ##צ
1115
+ ##ɜ
1116
+ ##ܠ
1117
+ ##ܗ
1118
+ ##ܐ
1119
+ ##ะ
1120
+ ##น
1121
+ ##є
1122
+ ##ゆ
1123
+ ##ɳ
1124
+ ##נ
1125
+ ##ჳ