Spaces:
Running
Running
csukuangfj
committed on
Commit
•
dd6a80b
1
Parent(s):
cbfcc94
update sherpa-onnx to use piper-phonemize
Browse files
- app.py +13 -0
- model.py +2 -7
- requirements.txt +1 -1
app.py
CHANGED
@@ -25,6 +25,7 @@ import uuid
|
|
25 |
|
26 |
import gradio as gr
|
27 |
import soundfile as sf
|
|
|
28 |
|
29 |
from model import get_pretrained_model, language_to_models
|
30 |
|
@@ -185,7 +186,19 @@ with demo:
|
|
185 |
|
186 |
gr.Markdown(description)
|
187 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
188 |
if __name__ == "__main__":
|
|
|
189 |
formatter = "%(asctime)s %(levelname)s [%(filename)s:%(lineno)d] %(message)s"
|
190 |
|
191 |
logging.basicConfig(format=formatter, level=logging.INFO)
|
|
|
25 |
|
26 |
import gradio as gr
|
27 |
import soundfile as sf
|
28 |
+
import system
|
29 |
|
30 |
from model import get_pretrained_model, language_to_models
|
31 |
|
|
|
186 |
|
187 |
gr.Markdown(description)
|
188 |
|
189 |
+
|
190 |
+
def download_espeak_ng_data():
    """Download and unpack the espeak-ng data archive under /tmp.

    Runs a short shell script that changes to /tmp, fetches
    espeak-ng-data.tar.bz2 from the sherpa-onnx GitHub releases with
    wget, and extracts it with tar.

    The exit status of the shell script is not checked, so a failed
    download or extraction does not raise here.
    """
    # Imported locally so the function does not depend on a module-level
    # `import os` being present.
    import os

    # Fixed: the original called the non-existent `os.sytem`, which raises
    # AttributeError as soon as the function runs.
    os.system(
        """
    cd /tmp
    wget https://github.com/k2-fsa/sherpa-onnx/releases/download/tts-models/espeak-ng-data.tar.bz2
    tar xf espeak-ng-data.tar.bz2
    """
    )
|
198 |
+
|
199 |
+
|
200 |
if __name__ == "__main__":
|
201 |
+
download_espeak_ng_data()
|
202 |
formatter = "%(asctime)s %(levelname)s [%(filename)s:%(lineno)d] %(message)s"
|
203 |
|
204 |
logging.basicConfig(format=formatter, level=logging.INFO)
|
model.py
CHANGED
@@ -124,12 +124,6 @@ def _get_vits_piper(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
|
|
124 |
subfolder=".",
|
125 |
)
|
126 |
|
127 |
-
lexicon = get_file(
|
128 |
-
repo_id=repo_id,
|
129 |
-
filename="lexicon.txt",
|
130 |
-
subfolder=".",
|
131 |
-
)
|
132 |
-
|
133 |
tokens = get_file(
|
134 |
repo_id=repo_id,
|
135 |
filename="tokens.txt",
|
@@ -140,7 +134,8 @@ def _get_vits_piper(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
|
|
140 |
model=sherpa_onnx.OfflineTtsModelConfig(
|
141 |
vits=sherpa_onnx.OfflineTtsVitsModelConfig(
|
142 |
model=model,
|
143 |
-
lexicon=
|
|
|
144 |
tokens=tokens,
|
145 |
length_scale=1.0 / speed,
|
146 |
),
|
|
|
124 |
subfolder=".",
|
125 |
)
|
126 |
|
|
|
|
|
|
|
|
|
|
|
|
|
127 |
tokens = get_file(
|
128 |
repo_id=repo_id,
|
129 |
filename="tokens.txt",
|
|
|
134 |
model=sherpa_onnx.OfflineTtsModelConfig(
|
135 |
vits=sherpa_onnx.OfflineTtsVitsModelConfig(
|
136 |
model=model,
|
137 |
+
lexicon="",
|
138 |
+
data_dir="/tmp/espeak-ng-data",
|
139 |
tokens=tokens,
|
140 |
length_scale=1.0 / speed,
|
141 |
),
|
requirements.txt
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
https://huggingface.co/csukuangfj/wheels/resolve/main/sherpa_onnx-1.8.
|
2 |
#sherpa-onnx
|
3 |
|
4 |
soundfile
|
|
|
1 |
+
https://huggingface.co/csukuangfj/wheels/resolve/main/sherpa_onnx-1.8.11-cp38-cp38-linux_x86_64.whl
|
2 |
#sherpa-onnx
|
3 |
|
4 |
soundfile
|