Xenova
/

esm2_t30_150M_UR50D

Transformers.js

Model card Files Files and versions Community

Xenova HF staff committed on Dec 10, 2023

Commit

a212657

•

1 Parent(s): d600498

Upload tokenizer.json

Files changed (1) hide show

tokenizer.json +57 -6

tokenizer.json CHANGED Viewed

@@ -2,7 +2,62 @@
   "version": "1.0",
   "truncation": null,
   "padding": null,
-  "added_tokens": [],
   "normalizer": null,
   "pre_tokenizer": {
     "type": "BertPreTokenizer"
@@ -64,11 +119,7 @@
       }
     }
   },
-  "decoder": {
-    "type": "WordPiece",
-    "prefix": "",
-    "cleanup": true
-  },
   "model": {
     "type": "WordPiece",
     "unk_token": "<unk>",

   "version": "1.0",
   "truncation": null,
   "padding": null,
+  "added_tokens": [
+    {
+      "id": 0,
+      "content": "<cls>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 1,
+      "content": "<pad>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 2,
+      "content": "<eos>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 3,
+      "content": "<unk>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 31,
+      "content": "<null_1>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32,
+      "content": "<mask>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    }
+  ],
   "normalizer": null,
   "pre_tokenizer": {
     "type": "BertPreTokenizer"
       }
     }
   },
+  "decoder": null,
   "model": {
     "type": "WordPiece",
     "unk_token": "<unk>",