Spaces:
Runtime error
Runtime error
Commit
•
9e35e59
1
Parent(s):
0f704ae
Update app.py
Browse files
app.py
CHANGED
@@ -6,8 +6,6 @@ import time
|
|
6 |
import os
|
7 |
|
8 |
BATCH_SIZE = 16
|
9 |
-
# TODO: remove token before release and update ckpt path
|
10 |
-
TOKEN = os.environ.get("HF_TOKEN", None)
|
11 |
|
12 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
13 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
@@ -17,7 +15,7 @@ model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
|
17 |
"openai/whisper-large-v2", torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True, use_flash_attention_2=use_flash_attention_2
|
18 |
)
|
19 |
distilled_model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
20 |
-
"
|
21 |
)
|
22 |
|
23 |
if not use_flash_attention_2:
|
|
|
6 |
import os
|
7 |
|
8 |
BATCH_SIZE = 16
|
|
|
|
|
9 |
|
10 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
11 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
|
|
15 |
"openai/whisper-large-v2", torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True, use_flash_attention_2=use_flash_attention_2
|
16 |
)
|
17 |
distilled_model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
18 |
+
"distil-whisper/distil-large-v2", torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True, use_flash_attention_2=use_flash_attention_2, token=TOKEN
|
19 |
)
|
20 |
|
21 |
if not use_flash_attention_2:
|