main-horse committed on
Commit
87b071d
1 Parent(s): 9383ec6

Upload tokenizer

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +3 -1
tokenizer_config.json CHANGED
@@ -1,9 +1,11 @@
1
  {
2
  "add_prefix_space": false,
 
3
  "bos_token": "<|endoftext|>",
4
  "clean_up_tokenization_spaces": true,
 
5
  "eos_token": "<|endoftext|>",
6
- "model_max_length": 2048,
7
  "tokenizer_class": "GPTNeoXTokenizer",
8
  "unk_token": "<|endoftext|>"
9
  }
 
1
  {
2
  "add_prefix_space": false,
3
+ "boi_token": "<info>",
4
  "bos_token": "<|endoftext|>",
5
  "clean_up_tokenization_spaces": true,
6
+ "eoi_token": "</info>",
7
  "eos_token": "<|endoftext|>",
8
+ "model_max_length": 9999999,
9
  "tokenizer_class": "GPTNeoXTokenizer",
10
  "unk_token": "<|endoftext|>"
11
  }