duraad committed on
Commit
1bf0497
1 Parent(s): ee42a37

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +2 -2
  2. tokenizer_config.json +4 -0
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6159d7ec2f2ff06356659536274e669822a98188a9cf7f009f92a264ab5abf4
3
- size 16330559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fabeeba8c57563ba6a0a37b67dc2bf3b451983d3ee33814230168ac966c1cad
3
+ size 16315311
tokenizer_config.json CHANGED
@@ -30,9 +30,13 @@
30
  "eos_token": "</s>",
31
  "extra_ids": 0,
32
  "legacy": true,
 
33
  "model_max_length": 1000000000000000019884624838656,
34
  "pad_token": "<pad>",
35
  "sp_model_kwargs": {},
 
36
  "tokenizer_class": "T5Tokenizer",
 
 
37
  "unk_token": "<unk>"
38
  }
 
30
  "eos_token": "</s>",
31
  "extra_ids": 0,
32
  "legacy": true,
33
+ "max_length": 512,
34
  "model_max_length": 1000000000000000019884624838656,
35
  "pad_token": "<pad>",
36
  "sp_model_kwargs": {},
37
+ "stride": 0,
38
  "tokenizer_class": "T5Tokenizer",
39
+ "truncation_side": "right",
40
+ "truncation_strategy": "longest_first",
41
  "unk_token": "<unk>"
42
  }