ysharma HF staff committed on
Commit cd49d70
1 Parent(s): a18abb2
Files changed (1)
  1. app.py +3 -8
app.py CHANGED
@@ -3,9 +3,6 @@ os.system("pip install git+https://github.com/openai/whisper.git")
 os.system("pip install neon-tts-plugin-coqui==0.6.0")
 import gradio as gr
 import whisper
-
-#import os
-#import gradio as gr
 import requests
 import tempfile
 from neon_tts_plugin_coqui import CoquiTTS
@@ -15,9 +12,7 @@ from datasets import load_dataset
 dataset = load_dataset("ysharma/short_jokes")
 
 # Language common in both the multilingual models - English, Chinese, Spanish, and French etc
-# So it would make sense to test the App on these four prominently
-
-# Whisper: Speech-to-text
+# /model 1: Whisper: Speech-to-text
 model = whisper.load_model("base")
 #model_med = whisper.load_model("medium")
 # Languages covered in Whisper - (exhaustive list) :
@@ -43,7 +38,7 @@ model = whisper.load_model("base")
 #"ln": "lingala", "ha": "hausa", "ba": "bashkir", "jw": "javanese", "su": "sundanese",
 
 
-# Text-to-Speech
+#Model 2: Text-to-Speech
 LANGUAGES = list(CoquiTTS.langs.keys())
 coquiTTS = CoquiTTS()
 print(f"Languages for Coqui are: {LANGUAGES}")
@@ -89,7 +84,7 @@ def whisper_stt(audio):
 #options_transc = whisper.DecodingOptions(fp16 = False, language=lang, task='transcribe') #lang
 options_transl = whisper.DecodingOptions(fp16 = False, language='en', task='translate') #lang
 #result_transc = whisper.decode(model_med, mel, options_transc)
-result_transl = whisper.decode(model_med, mel, options_transl)
+result_transl = whisper.decode(model, mel, options_transl) #model_med
 
 # print the recognized text
 #print(f"transcript is : {result_transc.text}")