Fix README example: the decoder start token ID should actually be 0 (set `decoder_start_token_id=0`)
Browse files
README.md
CHANGED
@@ -447,7 +447,7 @@ input_ids = tokenizer(text, return_tensors="pt").input_ids
|
|
447 |
outputs = model.generate(
|
448 |
input_ids=input_ids,
|
449 |
generation_config=GenerationConfig(
|
450 |
-
decoder_start_token_id=
|
451 |
))
|
452 |
|
453 |
tokenizer.decode(outputs[0], skip_special_tokens=True)
|
|
|
447 |
outputs = model.generate(
|
448 |
input_ids=input_ids,
|
449 |
generation_config=GenerationConfig(
|
450 |
+
decoder_start_token_id=0,
|
451 |
))
|
452 |
|
453 |
tokenizer.decode(outputs[0], skip_special_tokens=True)
|