Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -14,10 +14,10 @@ vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
|
|
14 |
|
15 |
speaker_embeddings = {
|
16 |
"BDL": "spkemb/triniFemale.npy",
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
}
|
22 |
|
23 |
|
@@ -59,16 +59,16 @@ def predict(text, speaker):
|
|
59 |
|
60 |
title = "SpeechT5: Speech Synthesis"
|
61 |
|
62 |
-
description = "
|
63 |
-
The <b>SpeechT5</b> model is pre-trained on text as well as speech inputs, with targets that are also a mix of text and speech.
|
64 |
-
By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
|
65 |
|
66 |
-
SpeechT5 can be fine-tuned for different speech tasks. This space demonstrates the <b>text-to-speech</b> (TTS) checkpoint for the English language.
|
67 |
|
68 |
-
See also the <a href="https://huggingface.co/spaces/Matthijs/speecht5-asr-demo">speech recognition (ASR) demo</a>
|
69 |
-
and the <a href="https://huggingface.co/spaces/Matthijs/speecht5-vc-demo">voice conversion demo</a>.
|
70 |
|
71 |
-
Refer to <a href="https://colab.research.google.com/drive/1i7I5pzBcU3WDFarDnzweIj4-sVVoIUFJ">this Colab notebook</a> to learn how to fine-tune the SpeechT5 TTS model on your own dataset or language.
|
72 |
|
73 |
<b>How to use:</b> Enter some English text and choose a speaker. The output is a mel spectrogram, which is converted to a mono 16 kHz waveform by the
|
74 |
HiFi-GAN vocoder. Because the model always applies random dropout, each attempt will give slightly different results.
|
@@ -91,14 +91,14 @@ article = """
|
|
91 |
primaryClass={eess.AS},
|
92 |
year={2021}
|
93 |
}
|
94 |
-
|
95 |
|
96 |
-
|
97 |
|
98 |
</div>
|
99 |
"""
|
100 |
|
101 |
-
#examples = [
|
102 |
#["It is not in the stars to hold our destiny but in ourselves.", "BDL (male)"],
|
103 |
#["The octopus and Oliver went to the opera in October.", "CLB (female)"],
|
104 |
#["She sells seashells by the seashore. I saw a kitten eating chicken in the kitchen.", "RMS (male)"],
|
|
|
14 |
|
15 |
speaker_embeddings = {
|
16 |
"BDL": "spkemb/triniFemale.npy",
|
17 |
+
"CLB": "spkemb/triniFemale.npy",
|
18 |
+
"KSP": "spkemb/triniFemale.npy",
|
19 |
+
"RMS": "spkemb/triniFemale.npy",
|
20 |
+
"SLT": "spkemb/triniFemale.npy",
|
21 |
}
|
22 |
|
23 |
|
|
|
59 |
|
60 |
title = "SpeechT5: Speech Synthesis"
|
61 |
|
62 |
+
#description = "
|
63 |
+
#The <b>SpeechT5</b> model is pre-trained on text as well as speech inputs, with targets that are also a mix of text and speech.
|
64 |
+
#By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
|
65 |
|
66 |
+
#SpeechT5 can be fine-tuned for different speech tasks. This space demonstrates the <b>text-to-speech</b> (TTS) checkpoint for the English language.
|
67 |
|
68 |
+
#See also the <a href="https://huggingface.co/spaces/Matthijs/speecht5-asr-demo">speech recognition (ASR) demo</a>
|
69 |
+
#and the <a href="https://huggingface.co/spaces/Matthijs/speecht5-vc-demo">voice conversion demo</a>.
|
70 |
|
71 |
+
#Refer to <a href="https://colab.research.google.com/drive/1i7I5pzBcU3WDFarDnzweIj4-sVVoIUFJ">this Colab notebook</a> to learn how to fine-tune the SpeechT5 TTS model on your own dataset or language.
|
72 |
|
73 |
<b>How to use:</b> Enter some English text and choose a speaker. The output is a mel spectrogram, which is converted to a mono 16 kHz waveform by the
|
74 |
HiFi-GAN vocoder. Because the model always applies random dropout, each attempt will give slightly different results.
|
|
|
91 |
primaryClass={eess.AS},
|
92 |
year={2021}
|
93 |
}
|
94 |
+
#</pre>
|
95 |
|
96 |
+
#<p>Speaker embeddings were generated from <a href="http://www.festvox.org/cmu_arctic/">CMU ARCTIC</a> using <a href="https://huggingface.co/mechanicalsea/speecht5-vc/blob/main/manifest/utils/prep_cmu_arctic_spkemb.py">this script</a>.</p>
|
97 |
|
98 |
</div>
|
99 |
"""
|
100 |
|
101 |
+
#examples = [
|
102 |
#["It is not in the stars to hold our destiny but in ourselves.", "BDL (male)"],
|
103 |
#["The octopus and Oliver went to the opera in October.", "CLB (female)"],
|
104 |
#["She sells seashells by the seashore. I saw a kitten eating chicken in the kitchen.", "RMS (male)"],
|