Upload tokenizer

Files changed (4) hide show

source.spm CHANGED Viewed

Binary files a/source.spm and b/source.spm differ

target.spm CHANGED Viewed

Binary files a/target.spm and b/target.spm differ

tokenizer_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "added_tokens_decoder": {
-    "0": {
       "content": "</s>",
       "lstrip": false,
       "normalized": false,
@@ -8,7 +8,7 @@
       "single_word": false,
       "special": true
     },
-    "1": {
       "content": "<unk>",
       "lstrip": false,
       "normalized": false,
@@ -16,7 +16,7 @@
       "single_word": false,
       "special": true
     },
-    "62388": {
       "content": "<pad>",
       "lstrip": false,
       "normalized": false,

 {
   "added_tokens_decoder": {
+    "43741": {
       "content": "</s>",
       "lstrip": false,
       "normalized": false,
       "single_word": false,
       "special": true
     },
+    "52508": {
       "content": "<unk>",
       "lstrip": false,
       "normalized": false,
       "single_word": false,
       "special": true
     },
+    "57059": {
       "content": "<pad>",
       "lstrip": false,
       "normalized": false,

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff