Upload tokenizer
Browse files
- tokenizer.json +1 -1
- tokenizer_config.json +1 -1
tokenizer.json
CHANGED
@@ -53,7 +53,7 @@
|
|
53 |
"type": "BertNormalizer",
|
54 |
"clean_text": true,
|
55 |
"handle_chinese_chars": false,
|
56 |
-
"strip_accents": null,
|
57 |
"lowercase": false
|
58 |
},
|
59 |
"pre_tokenizer": {
|
|
|
53 |
"type": "BertNormalizer",
|
54 |
"clean_text": true,
|
55 |
"handle_chinese_chars": false,
|
56 |
+
"strip_accents": true,
|
57 |
"lowercase": false
|
58 |
},
|
59 |
"pre_tokenizer": {
|
tokenizer_config.json
CHANGED
@@ -9,7 +9,7 @@
|
|
9 |
"never_split": null,
|
10 |
"pad_token": "[PAD]",
|
11 |
"sep_token": "[SEP]",
|
12 |
-
"strip_accents": null,
|
13 |
"tokenize_chinese_chars": false,
|
14 |
"tokenizer_class": "BertTokenizer",
|
15 |
"unk_token": "[UNK]"
|
|
|
9 |
"never_split": null,
|
10 |
"pad_token": "[PAD]",
|
11 |
"sep_token": "[SEP]",
|
12 |
+
"strip_accents": true,
|
13 |
"tokenize_chinese_chars": false,
|
14 |
"tokenizer_class": "BertTokenizer",
|
15 |
"unk_token": "[UNK]"
|