Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -68,9 +68,7 @@ def convert_to_wav(audio_file):
|
|
68 |
# @spaces.GPU(duration=300, queue=False)
|
69 |
# Set distinct pad and eos tokens
|
70 |
if processor.tokenizer.pad_token_id is None:
|
71 |
-
processor.tokenizer.pad_token_id = processor.tokenizer.
|
72 |
-
if processor.tokenizer.eos_token_id is None:
|
73 |
-
processor.tokenizer.eos_token_id = processor.tokenizer.convert_tokens_to_ids("[EOS]")
|
74 |
|
75 |
def transcribe_audio(audio_file, batch_size=4):
|
76 |
start_time = time.time()
|
@@ -92,7 +90,7 @@ def transcribe_audio(audio_file, batch_size=4):
|
|
92 |
inputs.input_features,
|
93 |
max_length=2048,
|
94 |
num_beams=8,
|
95 |
-
task="transcribe",
|
96 |
attention_mask=attention_mask,
|
97 |
language="no",
|
98 |
pad_token_id=processor.tokenizer.pad_token_id,
|
|
|
68 |
# @spaces.GPU(duration=300, queue=False)
|
69 |
# Set distinct pad and eos tokens
|
70 |
if processor.tokenizer.pad_token_id is None:
|
71 |
+
processor.tokenizer.pad_token_id = processor.tokenizer.eos_token_id + 1
|
|
|
|
|
72 |
|
73 |
def transcribe_audio(audio_file, batch_size=4):
|
74 |
start_time = time.time()
|
|
|
90 |
inputs.input_features,
|
91 |
max_length=2048,
|
92 |
num_beams=8,
|
93 |
+
# task="transcribe",
|
94 |
attention_mask=attention_mask,
|
95 |
language="no",
|
96 |
pad_token_id=processor.tokenizer.pad_token_id,
|