Matthijs Hollemans committed on
Commit
f539e6d
1 Parent(s): 1bb7c1d

add a demo song

Browse files
Files changed (2) hide show
  1. app.py +3 -1
  2. examples/beos_song.mp3 +3 -0
app.py CHANGED
@@ -111,7 +111,7 @@ def predict(audio_path):
111
  title = "Word-level timestamps with Whisper"
112
 
113
  description = """
114
- This demo shows Whisper <b>word-level timestamps</b> in action using Hugging Face Transformers. It creates a video showing subtitled audio with the current word highlighted.
115
 
116
  This demo uses the <b>openai/whisper-small</b> checkpoint. Since it's only a demo, the output is limited to the first 60 seconds of audio.
117
  """
@@ -125,6 +125,7 @@ article = """
125
  <li>Shakespeare's "Henry V" speech from <a href="https://freesound.org/people/acclivity/sounds/24096/">acclivity</a> (CC BY-NC 4.0 license)
126
  <li>"Here's to the Crazy Ones" speech by Steve Jobs</li>
127
  <li>"Stupid People" comedy routine by Bill Engvall</li>
 
128
  <li>Lato font by Łukasz Dziedzic (licensed under Open Font License)</li>
129
  <li>Whisper model by OpenAI</li>
130
  </ul>
@@ -136,6 +137,7 @@ examples = [
136
  "examples/steve_jobs_crazy_ones.mp3",
137
  "examples/henry5.wav",
138
  "examples/stupid_people.mp3",
 
139
  ]
140
 
141
  gr.Interface(
 
111
  title = "Word-level timestamps with Whisper"
112
 
113
  description = """
114
+ This demo shows Whisper <b>word-level timestamps</b> in action using Hugging Face Transformers. It creates a video showing subtitled audio with the current word highlighted. It can even do music lyrics!
115
 
116
  This demo uses the <b>openai/whisper-small</b> checkpoint. Since it's only a demo, the output is limited to the first 60 seconds of audio.
117
  """
 
125
  <li>Shakespeare's "Henry V" speech from <a href="https://freesound.org/people/acclivity/sounds/24096/">acclivity</a> (CC BY-NC 4.0 license)
126
  <li>"Here's to the Crazy Ones" speech by Steve Jobs</li>
127
  <li>"Stupid People" comedy routine by Bill Engvall</li>
128
+ <li>"BeOS, It's The OS" song by The Cotton Squares</li>
129
  <li>Lato font by Łukasz Dziedzic (licensed under Open Font License)</li>
130
  <li>Whisper model by OpenAI</li>
131
  </ul>
 
137
  "examples/steve_jobs_crazy_ones.mp3",
138
  "examples/henry5.wav",
139
  "examples/stupid_people.mp3",
140
+ "examples/beos_song.mp3",
141
  ]
142
 
143
  gr.Interface(
examples/beos_song.mp3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a9a0df5dba8bfd3f4dcc895d98f03552ac4220e7fb30267c20448d33684410b
3
+ size 1245689