sanchit-gandhi HF staff committed on
Commit
2ad1599
1 Parent(s): f9b9b93

fix optimum

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -7,6 +7,7 @@ import time
7
  import os
8
 
9
  BATCH_SIZE = 16
 
10
  TOKEN = os.environ.get("HF_TOKEN", None)
11
 
12
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
@@ -21,8 +22,8 @@ distilled_model = AutoModelForSpeechSeq2Seq.from_pretrained(
21
  )
22
 
23
  if not use_flash_attention_2:
24
- model = model.bettertransformer()
25
- distilled_model = distilled_model.bettertransformer()
26
 
27
  processor = AutoProcessor.from_pretrained("openai/whisper-tiny.en")
28
 
 
7
  import os
8
 
9
  BATCH_SIZE = 16
10
+ # TODO: remove token before release
11
  TOKEN = os.environ.get("HF_TOKEN", None)
12
 
13
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
 
22
  )
23
 
24
  if not use_flash_attention_2:
25
+ model = model.to_bettertransformer()
26
+ distilled_model = distilled_model.to_bettertransformer()
27
 
28
  processor = AutoProcessor.from_pretrained("openai/whisper-tiny.en")
29