Reverb-ASR

Sleeping

ndelworth08 committed on Sep 16

Commit

6458569

•

1 Parent(s): bb47424

switching verbatimicity parameter name

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,29 +45,30 @@ def recognition(audio, style=0):
         return "Input Error! Please enter one audio!"
     # NOTE: model supports 16k sample_rate
-    cat_embs = ','.join([str(s) for s in (1-style, style)])
     cat_embs = process_cat_embs(cat_embs)
     ans = model.transcribe(audio, cat_embs = cat_embs)
     if ans is None:
         return "ERROR! No text output! Please try again!"
     txt = ans['text']
     return txt
 # input
 inputs = [
     gr.inputs.Audio(source="microphone", type="filepath", label='Input audio'),
-    gr.Slider(0, 1, value=0, label="Style - from verbatim (0) to non-verbatim (1)", info="Choose between verbatim and NV"),
 ]
 output = gr.outputs.Textbox(label="Output Text")
-text = "Reginald Demo"
 # description
 description = (
-    "This is a speech recognition demo that supports verbatim and non-verbatim transcription. Try recording an audio with disfluencies (ex: \'uh\', \'um\') and testing both transcription styles."  # noqa
 )
 article = (

         return "Input Error! Please enter one audio!"
     # NOTE: model supports 16k sample_rate
+    cat_embs = ','.join([str(s) for s in (style, 1-style)])
     cat_embs = process_cat_embs(cat_embs)
     ans = model.transcribe(audio, cat_embs = cat_embs)
     if ans is None:
         return "ERROR! No text output! Please try again!"
     txt = ans['text']
+    txt = txt.replace('▁', ' ')
     return txt
 # input
 inputs = [
     gr.inputs.Audio(source="microphone", type="filepath", label='Input audio'),
+    gr.Slider(0, 1, value=0, label="Verbatimicity - from non-verbatim (0) to verbatim (1)", info="Choose a transcription style between non-verbatim and verbatim"),
 ]
 output = gr.outputs.Textbox(label="Output Text")
+text = "Reginald Transcription Styles Demo"
 # description
 description = (
+    "Reginald supports verbatim and non-verbatim transcription. Try recording an audio with disfluencies (ex: \'uh\', \'um\') and testing both transcription styles."  # noqa
 )
 article = (