Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -24,9 +24,15 @@ def whisper_speech_demo(text, lang, speaker_audio, mix_lang, mix_text):
|
|
24 |
print(f"Text: {text}, Lang: {lang}, Speaker Audio: {speaker_audio}, Mix Lang: {mix_lang}, Mix Text: {mix_text}")
|
25 |
pipe = Pipeline()
|
26 |
speaker_url = speaker_audio if speaker_audio is not None else None
|
|
|
|
|
|
|
|
|
|
|
|
|
27 |
|
28 |
if mix_lang and mix_text:
|
29 |
-
mixed_langs = mix_lang
|
30 |
mixed_texts = mix_text.split(',')
|
31 |
stoks = pipe.t2s.generate(mixed_texts, lang=mixed_langs)
|
32 |
audio_data = pipe.generate(stoks, speaker_url, lang=mixed_langs[0])
|
@@ -42,8 +48,8 @@ def whisper_speech_demo(text, lang, speaker_audio, mix_lang, mix_text):
|
|
42 |
audio_stereo = np.stack((audio_np, audio_np), axis=-1)
|
43 |
audio_stereo = audio_stereo.reshape(-1, 2)
|
44 |
|
45 |
-
|
46 |
-
|
47 |
with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as tmp_file:
|
48 |
sf.write(tmp_file.name, audio_stereo, 24000, format='WAV', subtype='PCM_16')
|
49 |
return tmp_file.name
|
|
|
24 |
print(f"Text: {text}, Lang: {lang}, Speaker Audio: {speaker_audio}, Mix Lang: {mix_lang}, Mix Text: {mix_text}")
|
25 |
pipe = Pipeline()
|
26 |
speaker_url = speaker_audio if speaker_audio is not None else None
|
27 |
+
if isinstance(lang, list):
|
28 |
+
if not lang:
|
29 |
+
raise ValueError("Language list is empty.")
|
30 |
+
lang = lang[0]
|
31 |
+
elif not isinstance(lang, str):
|
32 |
+
raise ValueError("Language is not specified correctly.")
|
33 |
|
34 |
if mix_lang and mix_text:
|
35 |
+
mixed_langs = mix_lang.split(',') if isinstance(mix_lang, str) else mix_lang
|
36 |
mixed_texts = mix_text.split(',')
|
37 |
stoks = pipe.t2s.generate(mixed_texts, lang=mixed_langs)
|
38 |
audio_data = pipe.generate(stoks, speaker_url, lang=mixed_langs[0])
|
|
|
48 |
audio_stereo = np.stack((audio_np, audio_np), axis=-1)
|
49 |
audio_stereo = audio_stereo.reshape(-1, 2)
|
50 |
|
51 |
+
print("Audio Array Shape:", audio_stereo.shape)
|
52 |
+
print("Audio Array Dtype:", audio_stereo.dtype)
|
53 |
with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as tmp_file:
|
54 |
sf.write(tmp_file.name, audio_stereo, 24000, format='WAV', subtype='PCM_16')
|
55 |
return tmp_file.name
|