camparchimedes committed on
Commit
49351f8
·
verified ·
1 Parent(s): 77f2e6a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -4
app.py CHANGED
@@ -68,9 +68,7 @@ def convert_to_wav(audio_file):
68
  # @spaces.GPU(duration=300, queue=False)
69
  # Set distinct pad and eos tokens
70
  if processor.tokenizer.pad_token_id is None:
71
- processor.tokenizer.pad_token_id = processor.tokenizer.convert_tokens_to_ids("[PAD]")
72
- if processor.tokenizer.eos_token_id is None:
73
- processor.tokenizer.eos_token_id = processor.tokenizer.convert_tokens_to_ids("[EOS]")
74
 
75
  def transcribe_audio(audio_file, batch_size=4):
76
  start_time = time.time()
@@ -92,7 +90,7 @@ def transcribe_audio(audio_file, batch_size=4):
92
  inputs.input_features,
93
  max_length=2048,
94
  num_beams=8,
95
- task="transcribe",
96
  attention_mask=attention_mask,
97
  language="no",
98
  pad_token_id=processor.tokenizer.pad_token_id,
 
68
  # @spaces.GPU(duration=300, queue=False)
69
  # Set distinct pad and eos tokens
70
  if processor.tokenizer.pad_token_id is None:
71
+ processor.tokenizer.pad_token_id = processor.tokenizer.eos_token_id + 1
 
 
72
 
73
  def transcribe_audio(audio_file, batch_size=4):
74
  start_time = time.time()
 
90
  inputs.input_features,
91
  max_length=2048,
92
  num_beams=8,
93
+ # task="transcribe",
94
  attention_mask=attention_mask,
95
  language="no",
96
  pad_token_id=processor.tokenizer.pad_token_id,