boris committed on
Commit
8bb2236
1 Parent(s): bc01f78

feat: output_length considers bos and eos

Browse files
Files changed (1) hide show
  1. seq2seq/run_seq2seq_flax.py +1 -1
seq2seq/run_seq2seq_flax.py CHANGED
@@ -82,7 +82,7 @@ MODEL_TYPES = tuple(conf.model_type for conf in MODEL_CONFIG_CLASSES)
82
 
83
  # Model hyperparameters, for convenience
84
  OUTPUT_VOCAB_SIZE = 16384 + 1 # encoded image token space + 1 for bos
85
- OUTPUT_LENGTH = 256 + 1 # number of encoded tokens + 1 for bos
86
  BOS_TOKEN_ID = 16384
87
  BASE_MODEL = 'facebook/bart-large-cnn'
88
 
 
82
 
83
  # Model hyperparameters, for convenience
84
  OUTPUT_VOCAB_SIZE = 16384 + 1 # encoded image token space + 1 for bos
85
+ OUTPUT_LENGTH = 256 + 2 # number of encoded tokens + 1 for bos + 1 for eos
86
  BOS_TOKEN_ID = 16384
87
  BASE_MODEL = 'facebook/bart-large-cnn'
88