jonatanklosko committed on
Commit
3e95818
1 Parent(s): 8852c40

Move <|endoftext|> from added_tokens.json to vocab.json

Browse files
Files changed (3) hide show
  1. added_tokens.json +0 -1
  2. tokenizer.json +2 -1
  3. vocab.json +1 -0
added_tokens.json CHANGED
@@ -17,7 +17,6 @@
17
  "<|da|>": 50285,
18
  "<|de|>": 50261,
19
  "<|el|>": 50281,
20
- "<|endoftext|>": 50257,
21
  "<|en|>": 50259,
22
  "<|es|>": 50262,
23
  "<|et|>": 50307,
 
17
  "<|da|>": 50285,
18
  "<|de|>": 50261,
19
  "<|el|>": 50281,
 
20
  "<|en|>": 50259,
21
  "<|es|>": 50262,
22
  "<|et|>": 50307,
tokenizer.json CHANGED
@@ -51334,7 +51334,8 @@
51334
  "ĠPakistani": 50253,
51335
  "Ġ('": 50254,
51336
  "åľº": 50255,
51337
- "": 50256
 
51338
  },
51339
  "merges": [
51340
  "Ġ a",
 
51334
  "ĠPakistani": 50253,
51335
  "Ġ('": 50254,
51336
  "åľº": 50255,
51337
+ "": 50256,
51338
+ "<|endoftext|>": 50257
51339
  },
51340
  "merges": [
51341
  "Ġ a",
vocab.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "": 50256,
 
3
  "!": 0,
4
  "!!": 1432,
5
  "!!!": 4589,
 
1
  {
2
  "": 50256,
3
+ "<|endoftext|>": 50257,
4
  "!": 0,
5
  "!!": 1432,
6
  "!!!": 4589,