peyash
/

distilbert-base-multilingual-cased

Model card Files and versions Community

peyash committed on Feb 2

Commit

72dceeb

•

1 Parent(s): d598696

Upload tokenizer

Files changed (2) hide show

special_tokens_map.json +5 -0
tokenizer.json +27 -0

special_tokens_map.json CHANGED Viewed

@@ -1,4 +1,9 @@
 {
   "cls_token": "[CLS]",
   "mask_token": "[MASK]",
   "pad_token": "[PAD]",

 {
+  "additional_special_tokens": [
+    "[DE]",
+    "[FR]",
+    "[ES]"
+  ],
   "cls_token": "[CLS]",
   "mask_token": "[MASK]",
   "pad_token": "[PAD]",

tokenizer.json CHANGED Viewed

@@ -12,6 +12,33 @@
       "normalized": false,
       "special": true
     },
     {
       "id": 100,
       "content": "[UNK]",

       "normalized": false,
       "special": true
     },
+    {
+      "id": 1,
+      "content": "[ES]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 2,
+      "content": "[DE]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 3,
+      "content": "[FR]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
     {
       "id": 100,
       "content": "[UNK]",