thealphamerc committed on
Commit
201db01
1 Parent(s): ebe9cbe

Added new sample voices audio

Browse files
.vscode/settings.json CHANGED
@@ -1,3 +1,7 @@
1
  {
2
- "cSpell.words": ["Elon"]
 
 
 
 
3
  }
 
1
  {
2
+ "cSpell.words": ["Elon"],
3
+ "[python]": {
4
+ "editor.defaultFormatter": "ms-python.autopep8"
5
+ },
6
+ "python.formatting.provider": "none"
7
  }
app.py CHANGED
@@ -2,16 +2,19 @@ from subprocess import call
2
  import gradio as gr
3
  import os
4
  from TTS.api import TTS
 
5
 
6
  # List available 🐸TTS models and choose the first one
7
- all_models = TTS.list_models()
8
  # for model in all_models:
9
  # print(model)
10
 
11
  # print("Using model: ", all_models[0])
12
- model = all_models[0]
13
  # Init TTS
14
 
 
 
15
 
16
  print("Downloading model...", '')
17
 
@@ -30,6 +33,10 @@ def run_cmd(command):
30
 
31
 
32
  def inference(text, speaker):
 
 
 
 
33
  if (speaker == 'Speaker-1'):
34
  speaker = 'input/amitabh.mp3'
35
  elif (speaker == 'Speaker-2'):
@@ -44,6 +51,10 @@ def inference(text, speaker):
44
  speaker = 'input/sample/Elon-Sample.wav'
45
  elif (speaker == 'Obama'):
46
  speaker = 'input/sample/Obama-sample.wav'
 
 
 
 
47
  else:
48
  speaker = 'input/z-default.wav'
49
  # print("speaker: ", speaker)
@@ -63,12 +74,12 @@ def inference(text, speaker):
63
 
64
 
65
  sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
66
- 'Speaker-4', 'Rock', 'Elon', 'Obama']
67
- inputs = [gr.inputs.Textbox(lines=5, label="Input Text"),
68
- gr.inputs.Dropdown(
69
  sampleInput, label="Sample Input", default="Speaker-1",)
70
  ]
71
- outputs = gr.outputs.Audio(type="filepath", label="Output Audio")
72
  title = "Text To Speech"
73
  description = "An example of using TTS to generate speech from text."
74
  article = ""
 
2
  import gradio as gr
3
  import os
4
  from TTS.api import TTS
5
+ from TTS.utils.synthesizer import Synthesizer
6
 
7
  # List available 🐸TTS models and choose the first one
8
+ # all_models = TTS.list_models()
9
  # for model in all_models:
10
  # print(model)
11
 
12
  # print("Using model: ", all_models[0])
13
+ # model = all_models[0]
14
  # Init TTS
15
 
16
+ MAX_TXT_LEN = 500
17
+
18
 
19
  print("Downloading model...", '')
20
 
 
33
 
34
 
35
  def inference(text, speaker):
36
+ if len(text) > MAX_TXT_LEN:
37
+ text = text[:MAX_TXT_LEN]
38
+ print(
39
+ f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
40
  if (speaker == 'Speaker-1'):
41
  speaker = 'input/amitabh.mp3'
42
  elif (speaker == 'Speaker-2'):
 
51
  speaker = 'input/sample/Elon-Sample.wav'
52
  elif (speaker == 'Obama'):
53
  speaker = 'input/sample/Obama-sample.wav'
54
+ elif (speaker == 'Tony'):
55
+ speaker = 'input/sample/tony-stark-2.wav'
56
+ elif (speaker == 'Madara Uchiha'):
57
+ speaker = 'input/sample/Madara.mp3'
58
  else:
59
  speaker = 'input/z-default.wav'
60
  # print("speaker: ", speaker)
 
74
 
75
 
76
  sampleInput = ['Speaker-1', 'Speaker-2', 'Speaker-3',
77
+ 'Speaker-4', 'Rock', 'Elon', 'Obama', 'Tony', 'Madara Uchiha']
78
+ inputs = [gr.Textbox(lines=5, label="Input Text"),
79
+ gr.Dropdown(
80
  sampleInput, label="Sample Input", default="Speaker-1",)
81
  ]
82
+ outputs = gr.Audio(type="filepath", label="Output Audio")
83
  title = "Text To Speech"
84
  description = "An example of using TTS to generate speech from text."
85
  article = ""
gradio_queue.db CHANGED
Binary files a/gradio_queue.db and b/gradio_queue.db differ
 
input/sample/Madara.mp3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:601c62ffb87f3879576194637190758defa9a13000c3fb38f814332a64e6835e
3
+ size 259062
input/sample/tony-stark-2.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:106c43d952d7caf2d9e372cf4f74c7febde7a8a543532b5fc5e3a02ab4956cc3
3
+ size 99862
input/sample/tony-stark.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a46f91b72ca5825e4166652af58155bb6c8e764b368b51da0652775a104c19fb
3
+ size 17998
output/output.wav CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07abadaef514caf57a002e76da940e5900a6851ccba39076c3e7eb4359fdf82d
3
- size 1364620
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6cbd93714af794b46b7ccd96d30949ae39b55343bb841abf37a2d17b4ce4824
3
+ size 172108