mrodriguez committed on
Commit
dfb8f1c
1 Parent(s): 159e927

feat(app): add example and small mods

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ *.wav filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -20,16 +20,14 @@ ACCEPTED_LANGUAGE_BEHAVIOUR = [
20
 
21
 
22
  def transcribe(
23
- audio_url: str = None,
24
  audio: str = None,
25
- video: str = None,
26
  language_behaviour: str = ACCEPTED_LANGUAGE_BEHAVIOUR[2],
27
  language: str = "english",
28
  ) -> dict:
29
  """
30
  This function transcribes audio to text using the Gladia API.
31
  It sends a request to the API with the given audio file or audio URL, and returns the transcribed text.
32
- Find your api key at gladia.io
33
 
34
  Parameters:
35
  audio_url (str): The URL of the audio file to transcribe. If audio_url is provided, audio file will be ignored.
@@ -58,10 +56,6 @@ def transcribe(
58
  "language_behaviour": (None, language_behaviour),
59
  }
60
 
61
- # priority given to the video
62
- if video:
63
- audio = video
64
-
65
  # priority given to the audio or video
66
  if audio:
67
  files["audio"] = (audio, open(audio, "rb"), "audio/wav")
@@ -107,25 +101,16 @@ def transcribe(
107
  iface = gr.Interface(
108
  title="Gladia.io fast audio transcription",
109
  description="""Gladia.io Whisper large-v2 fast audio transcription API
110
- is able to perform fast audio transcription for any audio / video or url format.<br/><br/>
111
- However it's prefered for faster performance to provide <br/>
112
- wav 16KHz with 16b encoding (pcm_u16be) to avoid further the conversion time.<br/>
113
- "automatic single language" language discovery behavior may also<br/>
114
- slow down (just a little bit - talking about ms) the process.
115
- <br/>
116
- Here is a benchmark ran on multiple Speech-To-Text providers
117
- ![Benchmarks](https://storage.gra.cloud.ovh.net/v1/AUTH_90df0bdc74f749ce86783e6550b1e4aa/public-files/benchmark.png)<br/>
118
- Join our [Slack](https://gladia-io.slack.com) to discuss with us.<br/><br/>
119
- Get your own API key on [Gladia.io](https://gladia.io/) during free alpha
120
  """,
121
  fn=transcribe,
122
  inputs=[
123
- gr.Textbox(
124
- lines=1,
125
- label="Audio/Video url to transcribe",
126
- ),
127
  gr.Audio(label="or Audio file to transcribe", source="upload", type="filepath"),
128
- gr.Video(label="or Video file to transcribe", source="upload", type="filepath"),
129
  gr.Dropdown(
130
  label="""Language transcription behaviour:\n
131
  If "manual", the language field must be provided and the API will transcribe the audio in the given language.
@@ -144,6 +129,10 @@ iface = gr.Interface(
144
  ),
145
  ],
146
  outputs="json",
 
 
 
 
147
  )
148
  iface.queue()
149
  iface.launch()
 
20
 
21
 
22
  def transcribe(
 
23
  audio: str = None,
 
24
  language_behaviour: str = ACCEPTED_LANGUAGE_BEHAVIOUR[2],
25
  language: str = "english",
26
  ) -> dict:
27
  """
28
  This function transcribes audio to text using the Gladia API.
29
  It sends a request to the API with the given audio file or audio URL, and returns the transcribed text.
30
+ Get your api key at gladia.io !
31
 
32
  Parameters:
33
  audio_url (str): The URL of the audio file to transcribe. If audio_url is provided, audio file will be ignored.
 
56
  "language_behaviour": (None, language_behaviour),
57
  }
58
 
 
 
 
 
59
  # priority given to the audio or video
60
  if audio:
61
  files["audio"] = (audio, open(audio, "rb"), "audio/wav")
 
101
  iface = gr.Interface(
102
  title="Gladia.io fast audio transcription",
103
  description="""Gladia.io Whisper large-v2 fast audio transcription API
104
+ is able to perform fast audio transcriptions for any audio / video.
105
+ For more details and a benchmark ran on multiple Speech-To-Text providers, please visit
106
+ [our post](https://medium.com/@gladia.io/gladia-alpha-launch-redefining-what-s-possible-with-speech-to-text-ai-686dd4312a86) on Medium.
107
+ <br/><br/>
108
+ You are more than welcome to join our [Slack](https://gladia-io.slack.com) to discuss with us
109
+ and also don't forget to get your own API key on [Gladia.io](https://gladia.io/) during the free alpha !
 
 
 
 
110
  """,
111
  fn=transcribe,
112
  inputs=[
 
 
 
 
113
  gr.Audio(label="or Audio file to transcribe", source="upload", type="filepath"),
 
114
  gr.Dropdown(
115
  label="""Language transcription behaviour:\n
116
  If "manual", the language field must be provided and the API will transcribe the audio in the given language.
 
129
  ),
130
  ],
131
  outputs="json",
132
+ examples=[
133
+ ["examples/good.will.hunting.wav", ACCEPTED_LANGUAGE_BEHAVIOUR[1], "english"],
134
+ ["examples/wolf.of.wall.street.wav", ACCEPTED_LANGUAGE_BEHAVIOUR[1], "english"],
135
+ ],
136
  )
137
  iface.queue()
138
  iface.launch()
examples/good.will.hunting.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:981492667ceb174e8a5d272ed68ad0a5198d98d836ff955b5e3b45d105d2a422
3
+ size 14251502
examples/wolf.of.wall.street.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da1283c0fa5e3829a7f6630c17d73647e494c39fc56f0eec8331ffaf0df23162
3
+ size 1601526