Update app.py
Browse files
app.py
CHANGED
|
@@ -46,39 +46,16 @@ for v in voicelist:
|
|
| 46 |
def synthesize(text, voice, lngsteps, password, progress=gr.Progress()):
    """Synthesize speech for `text` using a named preset voice.

    Args:
        text: Input text; split into sentence-sized chunks and synthesized
            chunk by chunk.
        voice: Preset voice name (lower-cased key into the `voices` dict).
        lngsteps: Diffusion step count forwarded to the inference call.
        password: Unused; retained so existing callers keep working.
        progress: Gradio progress tracker driving the per-chunk loop.

    Returns:
        Tuple of (24000, audio) — sample rate and the concatenated
        numpy waveform.

    Raises:
        gr.Error: If the text is empty or exceeds 50,000 characters.
    """
    if text.strip() == "":
        raise gr.Error("You must enter some text")
    # The raise below was orphaned (its guarding condition was lost);
    # restore the same 50k-character limit that clsynthesize enforces.
    if len(text) > 50000:
        raise gr.Error("Text must be <50k characters")
    texts = split_and_recombine_text(text)
    v = voice.lower()
    audios = []
    for t in progress.tqdm(texts):
        audios.append(styletts2importable.inference(t, voices[v], alpha=0.3, beta=0.7, diffusion_steps=lngsteps, embedding_scale=1))
    return (24000, np.concatenate(audios))
|
| 57 |
-
|
| 58 |
-
# if password == os.environ['ACCESS_CODE']:
|
| 59 |
-
# if text.strip() == "":
|
| 60 |
-
# raise gr.Error("You must enter some text")
|
| 61 |
-
# if lngsteps > 25:
|
| 62 |
-
# raise gr.Error("Max 25 steps")
|
| 63 |
-
# if lngsteps < 5:
|
| 64 |
-
# raise gr.Error("Min 5 steps")
|
| 65 |
-
# texts = split_and_recombine_text(text)
|
| 66 |
-
# v = voice.lower()
|
| 67 |
-
# audios = []
|
| 68 |
-
# for t in progress.tqdm(texts):
|
| 69 |
-
# audios.append(styletts2importable.inference(t, voices[v], alpha=0.3, beta=0.7, diffusion_steps=lngsteps, embedding_scale=1))
|
| 70 |
-
# return (24000, np.concatenate(audios))
|
| 71 |
-
# else:
|
| 72 |
-
# raise gr.Error('Wrong access code')
|
| 73 |
def clsynthesize(text, voice, vcsteps, progress=gr.Progress()):
|
| 74 |
-
|
| 75 |
-
# raise gr.Error("You must enter some text")
|
| 76 |
-
# # if global_phonemizer.phonemize([text]) > 300:
|
| 77 |
-
# if len(text) > 400:
|
| 78 |
-
# raise gr.Error("Text must be under 400 characters")
|
| 79 |
-
# # return (24000, styletts2importable.inference(text, styletts2importable.compute_style(voice), alpha=0.3, beta=0.7, diffusion_steps=20, embedding_scale=1))
|
| 80 |
-
# return (24000, styletts2importable.inference(text, styletts2importable.compute_style(voice), alpha=0.3, beta=0.7, diffusion_steps=vcsteps, embedding_scale=1))
|
| 81 |
-
if text.strip() == "":
|
| 82 |
raise gr.Error("You must enter some text")
|
| 83 |
if len(text) > 50000:
|
| 84 |
raise gr.Error("Text must be <50k characters")
|
|
@@ -88,11 +65,6 @@ def clsynthesize(text, voice, vcsteps, progress=gr.Progress()):
|
|
| 88 |
audios.append(styletts2importable.inference(t, styletts2importable.compute_style(voice), alpha=0.3, beta=0.7, diffusion_steps=vcsteps, embedding_scale=1))
|
| 89 |
return (24000, np.concatenate(audios))
|
| 90 |
def ljsynthesize(text, steps, progress=gr.Progress()):
|
| 91 |
-
# if text.strip() == "":
|
| 92 |
-
# raise gr.Error("You must enter some text")
|
| 93 |
-
# # if global_phonemizer.phonemize([text]) > 300:
|
| 94 |
-
# if len(text) > 400:
|
| 95 |
-
# raise gr.Error("Text must be under 400 characters")
|
| 96 |
noise = torch.randn(1,1,256).to('cuda' if torch.cuda.is_available() else 'cpu')
|
| 97 |
# return (24000, ljspeechimportable.inference(text, noise, diffusion_steps=7, embedding_scale=1))
|
| 98 |
if text.strip() == "":
|
|
|
|
| 46 |
def synthesize(text, voice, lngsteps, password, progress=gr.Progress()):
    """Synthesize speech for `text` using a named preset voice.

    Args:
        text: Input text; split into sentence-sized chunks and synthesized
            chunk by chunk.
        voice: Preset voice name (lower-cased key into the `voices` dict).
        lngsteps: Diffusion step count forwarded to the inference call.
        password: Unused; retained so existing callers keep working.
        progress: Gradio progress tracker driving the per-chunk loop.

    Returns:
        Tuple of (24000, audio) — sample rate and the concatenated
        numpy waveform.

    Raises:
        gr.Error: If the text is empty or exceeds 50,000 characters.
    """
    if text.strip() == "":
        raise gr.Error("You must enter some text")
    # Length validation restored for consistency: clsynthesize applies the
    # same 50k-character limit, but it was dropped from this function.
    if len(text) > 50000:
        raise gr.Error("Text must be <50k characters")
    texts = split_and_recombine_text(text)
    v = voice.lower()
    audios = []
    for t in progress.tqdm(texts):
        audios.append(styletts2importable.inference(t, voices[v], alpha=0.3, beta=0.7, diffusion_steps=lngsteps, embedding_scale=1))
    return (24000, np.concatenate(audios))
|
| 56 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
def clsynthesize(text, voice, vcsteps, progress=gr.Progress()):
|
| 58 |
+
if text.strip() == "":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 59 |
raise gr.Error("You must enter some text")
|
| 60 |
if len(text) > 50000:
|
| 61 |
raise gr.Error("Text must be <50k characters")
|
|
|
|
| 65 |
audios.append(styletts2importable.inference(t, styletts2importable.compute_style(voice), alpha=0.3, beta=0.7, diffusion_steps=vcsteps, embedding_scale=1))
|
| 66 |
return (24000, np.concatenate(audios))
|
| 67 |
def ljsynthesize(text, steps, progress=gr.Progress()):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 68 |
noise = torch.randn(1,1,256).to('cuda' if torch.cuda.is_available() else 'cpu')
|
| 69 |
# return (24000, ljspeechimportable.inference(text, noise, diffusion_steps=7, embedding_scale=1))
|
| 70 |
if text.strip() == "":
|