quantumaikr committed on
Commit
e48a606
1 Parent(s): 267c155

Upload tokenizer

Browse files
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 32000
3
+ }
special_tokens_map.json CHANGED
@@ -13,6 +13,7 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
 
16
  "unk_token": {
17
  "content": "",
18
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": "[PAD]",
17
  "unk_token": {
18
  "content": "",
19
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -18,8 +18,9 @@
18
  "rstrip": false,
19
  "single_word": false
20
  },
21
- "model_max_length": 1000000000000000019884624838656,
22
  "pad_token": null,
 
23
  "sp_model_kwargs": {},
24
  "tokenizer_class": "LlamaTokenizer",
25
  "unk_token": {
 
18
  "rstrip": false,
19
  "single_word": false
20
  },
21
+ "model_max_length": 512,
22
  "pad_token": null,
23
+ "padding_side": "right",
24
  "sp_model_kwargs": {},
25
  "tokenizer_class": "LlamaTokenizer",
26
  "unk_token": {