Chhabi committed on
Commit
bc2c762
1 Parent(s): 0ae48c2

Fine-tuned tokenizer with generation hyperparameters

Browse files
Files changed (2) hide show
  1. tokenizer.json +2 -2
  2. tokenizer_config.json +2 -1
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f73cbd2b4371a62ef7fa742e0a4650848022fe1ef073f5fbab9055909bfe87f
3
- size 16315311
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2f3270c4527f39178d6195ec802925c6b371fb910c2488f9e99d02a7e21d82a
3
+ size 16315412
tokenizer_config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<pad>",
@@ -30,7 +31,7 @@
30
  "eos_token": "</s>",
31
  "extra_ids": 0,
32
  "legacy": true,
33
- "max_length": 512,
34
  "model_max_length": 1000000000000000019884624838656,
35
  "pad_token": "<pad>",
36
  "sp_model_kwargs": {},
 
1
  {
2
+ "add_prefix_space": true,
3
  "added_tokens_decoder": {
4
  "0": {
5
  "content": "<pad>",
 
31
  "eos_token": "</s>",
32
  "extra_ids": 0,
33
  "legacy": true,
34
+ "max_length": 256,
35
  "model_max_length": 1000000000000000019884624838656,
36
  "pad_token": "<pad>",
37
  "sp_model_kwargs": {},