Spaces:
Runtime error
Runtime error
update
Browse files
app.py
CHANGED
@@ -26,27 +26,6 @@ def query(payload):
|
|
26 |
# Model 1: Whisper: Speech-to-text
|
27 |
model = whisper.load_model("base")
|
28 |
#model_med = whisper.load_model("medium")
|
29 |
-
# Languages covered in Whisper - (exhaustive list) :
|
30 |
-
#"en": "english", "zh": "chinese", "de": "german", "es": "spanish", "ru": "russian",
|
31 |
-
#"ko": "korean", "fr": "french", "ja": "japanese", "pt": "portuguese", "tr": "turkish",
|
32 |
-
#"pl": "polish", "ca": "catalan", "nl": "dutch", "ar": "arabic", "sv": "swedish",
|
33 |
-
#"it": "italian", "id": "indonesian", "hi": "hindi", "fi": "finnish", "vi": "vietnamese",
|
34 |
-
#"iw": "hebrew", "uk": "ukrainian", "el": "greek", "ms": "malay", "cs": "czech",
|
35 |
-
#"ro": "romanian", "da": "danish", "hu": "hungarian", "ta": "tamil", "no": "norwegian",
|
36 |
-
#"th": "thai", "ur": "urdu", "hr": "croatian", "bg": "bulgarian", "lt": "lithuanian",
|
37 |
-
#"la": "latin", "mi": "maori", "ml": "malayalam", "cy": "welsh", "sk": "slovak",
|
38 |
-
#"te": "telugu", "fa": "persian", "lv": "latvian", "bn": "bengali", "sr": "serbian",
|
39 |
-
#"az": "azerbaijani", "sl": "slovenian", "kn": "kannada", "et": "estonian",
|
40 |
-
#"mk": "macedonian", "br": "breton", "eu": "basque", "is": "icelandic", "hy": "armenian",
|
41 |
-
#"ne": "nepali", "mn": "mongolian", "bs": "bosnian", "kk": "kazakh", "sq": "albanian",
|
42 |
-
#"sw": "swahili", "gl": "galician", "mr": "marathi", "pa": "punjabi", "si": "sinhala",
|
43 |
-
#"km": "khmer", "sn": "shona", "yo": "yoruba", "so": "somali", "af": "afrikaans",
|
44 |
-
#"oc": "occitan", "ka": "georgian", "be": "belarusian", "tg": "tajik", "sd": "sindhi",
|
45 |
-
#"gu": "gujarati", "am": "amharic", "yi": "yiddish", "lo": "lao", "uz": "uzbek",
|
46 |
-
#"fo": "faroese", "ht": "haitian creole", "ps": "pashto", "tk": "turkmen", "nn": "nynorsk",
|
47 |
-
#"mt": "maltese", "sa": "sanskrit", "lb": "luxembourgish", "my": "myanmar", "bo": "tibetan",
|
48 |
-
#"tl": "tagalog", "mg": "malagasy", "as": "assamese", "tt": "tatar", "haw": "hawaiian",
|
49 |
-
#"ln": "lingala", "ha": "hausa", "ba": "bashkir", "jw": "javanese", "su": "sundanese",
|
50 |
|
51 |
|
52 |
#Model 2: Text-to-Speech
|
@@ -54,16 +33,11 @@ LANGUAGES = list(CoquiTTS.langs.keys())
|
|
54 |
coquiTTS = CoquiTTS()
|
55 |
print(f"Languages for Coqui are: {LANGUAGES}")
|
56 |
#Languages for Coqui are: ['en', 'es', 'fr', 'de', 'pl', 'uk', 'ro', 'hu', 'el', 'bg', 'nl', 'fi', 'sl', 'lv', 'ga']
|
57 |
-
# en - English, es - Spanish, fr - French, de - German, pl - Polish
|
58 |
-
# uk - Ukrainian, ro - Romanian, hu - Hungarian, el - Greek, bg - Bulgarian,
|
59 |
-
# nl - Dutch, fi - Finnish, sl - Slovenian, lv - Latvian, ga - Irish
|
60 |
-
|
61 |
|
62 |
|
63 |
# Driver function
|
64 |
def driver_fun(audio) :
|
65 |
translation, lang = whisper_stt(audio) # older : transcribe, translation, lang
|
66 |
-
#text1 = model.transcribe(audio)["text"]
|
67 |
|
68 |
random_val = random.randrange(0,231657)
|
69 |
if random_val < 226657:
|
|
|
26 |
# Model 1: Whisper: Speech-to-text
|
27 |
model = whisper.load_model("base")
|
28 |
#model_med = whisper.load_model("medium")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
29 |
|
30 |
|
31 |
#Model 2: Text-to-Speech
|
|
|
33 |
coquiTTS = CoquiTTS()
|
34 |
print(f"Languages for Coqui are: {LANGUAGES}")
|
35 |
#Languages for Coqui are: ['en', 'es', 'fr', 'de', 'pl', 'uk', 'ro', 'hu', 'el', 'bg', 'nl', 'fi', 'sl', 'lv', 'ga']
|
|
|
|
|
|
|
|
|
36 |
|
37 |
|
38 |
# Driver function
|
39 |
def driver_fun(audio) :
|
40 |
translation, lang = whisper_stt(audio) # older : transcribe, translation, lang
|
|
|
41 |
|
42 |
random_val = random.randrange(0,231657)
|
43 |
if random_val < 226657:
|