NTT123 committed on
Commit
2d49958
1 Parent(s): e4abdca

use reduction factor of 1.

Browse files
.gitattributes CHANGED
@@ -25,7 +25,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
- pretrained_model_ljs_500k.ckpt filter=lfs diff=lfs merge=lfs -text
29
  bazelisk-linux-amd64 filter=lfs diff=lfs merge=lfs -text
30
  wavegru.ckpt filter=lfs diff=lfs merge=lfs -text
31
  wavegru_mod.so filter=lfs diff=lfs merge=lfs -text
 
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
28
  bazelisk-linux-amd64 filter=lfs diff=lfs merge=lfs -text
29
  wavegru.ckpt filter=lfs diff=lfs merge=lfs -text
30
  wavegru_mod.so filter=lfs diff=lfs merge=lfs -text
31
+ pretrained_model_ljs_570k.ckpt filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -10,7 +10,7 @@ from inference import load_tacotron_model, load_wavegru_net, mel_to_wav, text_to
10
  from wavegru_cpp import extract_weight_mask, load_wavegru_cpp
11
 
12
  alphabet, tacotron_net, tacotron_config = load_tacotron_model(
13
- "./alphabet.txt", "./tacotron.toml", "./pretrained_model_ljs_500k.ckpt"
14
  )
15
 
16
 
 
10
  from wavegru_cpp import extract_weight_mask, load_wavegru_cpp
11
 
12
  alphabet, tacotron_net, tacotron_config = load_tacotron_model(
13
+ "./alphabet.txt", "./tacotron.toml", "./pretrained_model_ljs_570k.ckpt"
14
  )
15
 
16
 
inference.py CHANGED
@@ -28,7 +28,7 @@ def load_tacotron_model(alphabet_file, config_file, model_file):
28
  return alphabet, net, config
29
 
30
 
31
- tacotron_inference_fn = pax.pure(lambda net, text: net.inference(text, max_len=1200))
32
 
33
 
34
  def text_to_mel(net, text, alphabet, config):
 
28
  return alphabet, net, config
29
 
30
 
31
+ tacotron_inference_fn = pax.pure(lambda net, text: net.inference(text, max_len=2400))
32
 
33
 
34
  def text_to_mel(net, text, alphabet, config):
pretrained_model_ljs_500k.ckpt → pretrained_model_ljs_570k.ckpt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4eabdcac35cd016469d17678f9549bd25d1c9bf66c9089ea9f0632619ba91194
3
- size 53221435
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed5e35d9f290c45e229fe8135218e9e626eb3fdb4e48909721752e228f9f07ad
3
+ size 53525995
tacotron.toml CHANGED
@@ -19,7 +19,7 @@ PAD_TOKEN = 0
19
  TEST_DATA_SIZE = 1024
20
 
21
  # model
22
- RR = 2 # reduction factor
23
  MAX_RR=2
24
  ATTN_BIAS = 0.0 # control how slow the attention moves forward
25
  SIGMOID_NOISE = 2.0
 
19
  TEST_DATA_SIZE = 1024
20
 
21
  # model
22
+ RR = 1 # reduction factor
23
  MAX_RR=2
24
  ATTN_BIAS = 0.0 # control how slow the attention moves forward
25
  SIGMOID_NOISE = 2.0