Spaces:
Runtime error
Runtime error
NTT123
committed on
Commit
•
2d49958
1
Parent(s):
e4abdca
use reduction factor of 1.
Browse files
- .gitattributes +1 -1
- app.py +1 -1
- inference.py +1 -1
- pretrained_model_ljs_500k.ckpt → pretrained_model_ljs_570k.ckpt +2 -2
- tacotron.toml +1 -1
.gitattributes
CHANGED
@@ -25,7 +25,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
28 |
-
pretrained_model_ljs_500k.ckpt filter=lfs diff=lfs merge=lfs -text
|
29 |
bazelisk-linux-amd64 filter=lfs diff=lfs merge=lfs -text
|
30 |
wavegru.ckpt filter=lfs diff=lfs merge=lfs -text
|
31 |
wavegru_mod.so filter=lfs diff=lfs merge=lfs -text
|
|
|
|
25 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
28 |
bazelisk-linux-amd64 filter=lfs diff=lfs merge=lfs -text
|
29 |
wavegru.ckpt filter=lfs diff=lfs merge=lfs -text
|
30 |
wavegru_mod.so filter=lfs diff=lfs merge=lfs -text
|
31 |
+
pretrained_model_ljs_570k.ckpt filter=lfs diff=lfs merge=lfs -text
|
app.py
CHANGED
@@ -10,7 +10,7 @@ from inference import load_tacotron_model, load_wavegru_net, mel_to_wav, text_to
|
|
10 |
from wavegru_cpp import extract_weight_mask, load_wavegru_cpp
|
11 |
|
12 |
alphabet, tacotron_net, tacotron_config = load_tacotron_model(
|
13 |
-
"./alphabet.txt", "./tacotron.toml", "./pretrained_model_ljs_500k.ckpt"
|
14 |
)
|
15 |
|
16 |
|
|
|
10 |
from wavegru_cpp import extract_weight_mask, load_wavegru_cpp
|
11 |
|
12 |
alphabet, tacotron_net, tacotron_config = load_tacotron_model(
|
13 |
+
"./alphabet.txt", "./tacotron.toml", "./pretrained_model_ljs_570k.ckpt"
|
14 |
)
|
15 |
|
16 |
|
inference.py
CHANGED
@@ -28,7 +28,7 @@ def load_tacotron_model(alphabet_file, config_file, model_file):
|
|
28 |
return alphabet, net, config
|
29 |
|
30 |
|
31 |
-
tacotron_inference_fn = pax.pure(lambda net, text: net.inference(text, max_len=
|
32 |
|
33 |
|
34 |
def text_to_mel(net, text, alphabet, config):
|
|
|
28 |
return alphabet, net, config
|
29 |
|
30 |
|
31 |
+
tacotron_inference_fn = pax.pure(lambda net, text: net.inference(text, max_len=2400))
|
32 |
|
33 |
|
34 |
def text_to_mel(net, text, alphabet, config):
|
pretrained_model_ljs_500k.ckpt → pretrained_model_ljs_570k.ckpt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed5e35d9f290c45e229fe8135218e9e626eb3fdb4e48909721752e228f9f07ad
|
3 |
+
size 53525995
|
tacotron.toml
CHANGED
@@ -19,7 +19,7 @@ PAD_TOKEN = 0
|
|
19 |
TEST_DATA_SIZE = 1024
|
20 |
|
21 |
# model
|
22 |
-
RR =
|
23 |
MAX_RR=2
|
24 |
ATTN_BIAS = 0.0 # control how slow the attention moves forward
|
25 |
SIGMOID_NOISE = 2.0
|
|
|
19 |
TEST_DATA_SIZE = 1024
|
20 |
|
21 |
# model
|
22 |
+
RR = 1 # reduction factor
|
23 |
MAX_RR=2
|
24 |
ATTN_BIAS = 0.0 # control how slow the attention moves forward
|
25 |
SIGMOID_NOISE = 2.0
|