unilight committed on
Commit
d6b61d7
1 Parent(s): 28dab9e

Upload with huggingface_hub

Browse files
.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:176b10dfa4ad8b4c66348e49740f1668cb209f424cb2d43d7fb359a76c3c27f3
3
+ size 170
TEF1/checkpoint-10000steps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:275726ab0bb063ae5d44f81793d9d3ee8624cd563a01918cc01fd2f7ac02d118
3
+ size 339923709
TEF1/config.yml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ additional_config: null
2
+ allow_cache: true
3
+ batch_size: 6
4
+ config: conf/taco2_ar.yaml
5
+ dev_scp: data/TEF1_dev/wav.scp
6
+ distributed: false
7
+ eval_interval_steps: 1000
8
+ fft_size: 1024
9
+ fmax: 7600
10
+ fmin: 80
11
+ global_gain_scale: 1.0
12
+ grad_norm: 1.0
13
+ hop_size: 256
14
+ init_checkpoint: ''
15
+ log_interval_steps: 100
16
+ main_loss_type: L1Loss
17
+ model_params:
18
+ ar: true
19
+ encoder_type: taco2
20
+ hidden_dim: 1024
21
+ lstmp_dropout_rate: 0.2
22
+ lstmp_layernorm: false
23
+ lstmp_layers: 2
24
+ lstmp_proj_dim: 256
25
+ prenet_dim: 256
26
+ prenet_dropout_rate: 0.5
27
+ prenet_layers: 2
28
+ model_type: Taco2_AR
29
+ num_mels: 80
30
+ num_save_intermediate_results: 4
31
+ num_workers: 2
32
+ optimizer_params:
33
+ lr: 0.0001
34
+ optimizer_type: AdamW
35
+ outdir: exp/TEF1_ppg_sxliu_taco2_ar
36
+ pin_memory: true
37
+ rank: 0
38
+ resume: ''
39
+ sampling_rate: 24000
40
+ save_interval_steps: 1000
41
+ scheduler: linear_schedule_with_warmup
42
+ scheduler_params:
43
+ num_warmup_steps: 4000
44
+ train_max_steps: 10000
45
+ train_scp: data/TEF1_train/wav.scp
46
+ trg_stats: exp/TEF1_ppg_sxliu_taco2_ar/stats.h5
47
+ trim_frame_size: 2048
48
+ trim_hop_size: 512
49
+ trim_silence: false
50
+ trim_threshold_in_db: 60
51
+ upstream: ppg_sxliu
52
+ verbose: 1
53
+ version: 0.1.5
54
+ vocoder:
55
+ checkpoint: ./downloads/pwg_task1/checkpoint-400000steps.pkl
56
+ config: ./downloads/pwg_task1/config.yml
57
+ stats: ./downloads/pwg_task1/stats.h5
58
+ win_length: null
59
+ window: hann
TEF1/stats.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a72312fe95d90db14a7fb5004e37a170b9331e585450ebbd5eb92470e132704
3
+ size 4736
TEF2/checkpoint-10000steps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f29a4f3e7954b2fcb37d8c3a61928fd303587b0590a54baec2f03fd9b6b20b7e
3
+ size 339923709
TEF2/config.yml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ additional_config: null
2
+ allow_cache: true
3
+ batch_size: 6
4
+ config: conf/taco2_ar.yaml
5
+ dev_scp: data/TEF2_dev/wav.scp
6
+ distributed: false
7
+ eval_interval_steps: 1000
8
+ fft_size: 1024
9
+ fmax: 7600
10
+ fmin: 80
11
+ global_gain_scale: 1.0
12
+ grad_norm: 1.0
13
+ hop_size: 256
14
+ init_checkpoint: ''
15
+ log_interval_steps: 100
16
+ main_loss_type: L1Loss
17
+ model_params:
18
+ ar: true
19
+ encoder_type: taco2
20
+ hidden_dim: 1024
21
+ lstmp_dropout_rate: 0.2
22
+ lstmp_layernorm: false
23
+ lstmp_layers: 2
24
+ lstmp_proj_dim: 256
25
+ prenet_dim: 256
26
+ prenet_dropout_rate: 0.5
27
+ prenet_layers: 2
28
+ model_type: Taco2_AR
29
+ num_mels: 80
30
+ num_save_intermediate_results: 4
31
+ num_workers: 2
32
+ optimizer_params:
33
+ lr: 0.0001
34
+ optimizer_type: AdamW
35
+ outdir: exp/TEF2_ppg_sxliu_taco2_ar
36
+ pin_memory: true
37
+ rank: 0
38
+ resume: ''
39
+ sampling_rate: 24000
40
+ save_interval_steps: 1000
41
+ scheduler: linear_schedule_with_warmup
42
+ scheduler_params:
43
+ num_warmup_steps: 4000
44
+ train_max_steps: 10000
45
+ train_scp: data/TEF2_train/wav.scp
46
+ trg_stats: exp/TEF2_ppg_sxliu_taco2_ar/stats.h5
47
+ trim_frame_size: 2048
48
+ trim_hop_size: 512
49
+ trim_silence: false
50
+ trim_threshold_in_db: 60
51
+ upstream: ppg_sxliu
52
+ verbose: 1
53
+ version: 0.1.5
54
+ vocoder:
55
+ checkpoint: ./downloads/pwg_task1/checkpoint-400000steps.pkl
56
+ config: ./downloads/pwg_task1/config.yml
57
+ stats: ./downloads/pwg_task1/stats.h5
58
+ win_length: null
59
+ window: hann
TEF2/stats.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84b0c2ec485638324d2bbadc1af4a878d9d4f552a8648d1ea4e46caa4fb4453e
3
+ size 4736
TEM1/checkpoint-10000steps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b0a18462634e9b8b49b20fd44664c4c86fb31a676d65e582fcaa15cd1f1ad4d
3
+ size 339923709
TEM1/config.yml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ additional_config: null
2
+ allow_cache: true
3
+ batch_size: 6
4
+ config: conf/taco2_ar.yaml
5
+ dev_scp: data/TEM1_dev/wav.scp
6
+ distributed: false
7
+ eval_interval_steps: 1000
8
+ fft_size: 1024
9
+ fmax: 7600
10
+ fmin: 80
11
+ global_gain_scale: 1.0
12
+ grad_norm: 1.0
13
+ hop_size: 256
14
+ init_checkpoint: ''
15
+ log_interval_steps: 100
16
+ main_loss_type: L1Loss
17
+ model_params:
18
+ ar: true
19
+ encoder_type: taco2
20
+ hidden_dim: 1024
21
+ lstmp_dropout_rate: 0.2
22
+ lstmp_layernorm: false
23
+ lstmp_layers: 2
24
+ lstmp_proj_dim: 256
25
+ prenet_dim: 256
26
+ prenet_dropout_rate: 0.5
27
+ prenet_layers: 2
28
+ model_type: Taco2_AR
29
+ num_mels: 80
30
+ num_save_intermediate_results: 4
31
+ num_workers: 2
32
+ optimizer_params:
33
+ lr: 0.0001
34
+ optimizer_type: AdamW
35
+ outdir: exp/TEM1_ppg_sxliu_taco2_ar
36
+ pin_memory: true
37
+ rank: 0
38
+ resume: ''
39
+ sampling_rate: 24000
40
+ save_interval_steps: 1000
41
+ scheduler: linear_schedule_with_warmup
42
+ scheduler_params:
43
+ num_warmup_steps: 4000
44
+ train_max_steps: 10000
45
+ train_scp: data/TEM1_train/wav.scp
46
+ trg_stats: exp/TEM1_ppg_sxliu_taco2_ar/stats.h5
47
+ trim_frame_size: 2048
48
+ trim_hop_size: 512
49
+ trim_silence: false
50
+ trim_threshold_in_db: 60
51
+ upstream: ppg_sxliu
52
+ verbose: 1
53
+ version: 0.1.5
54
+ vocoder:
55
+ checkpoint: ./downloads/pwg_task1/checkpoint-400000steps.pkl
56
+ config: ./downloads/pwg_task1/config.yml
57
+ stats: ./downloads/pwg_task1/stats.h5
58
+ win_length: null
59
+ window: hann
TEM1/stats.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1beb905d2af5d6906779fdbe3f621172ba9452bbd524bf5a0be6592933c4ad11
3
+ size 4736
TEM2/checkpoint-10000steps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d43d40f6b0d2f507ad7549bbc2cc52455ba32dc9178e04a205ce57148ed56da2
3
+ size 339923709
TEM2/config.yml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ additional_config: null
2
+ allow_cache: true
3
+ batch_size: 6
4
+ config: conf/taco2_ar.yaml
5
+ dev_scp: data/TEM2_dev/wav.scp
6
+ distributed: false
7
+ eval_interval_steps: 1000
8
+ fft_size: 1024
9
+ fmax: 7600
10
+ fmin: 80
11
+ global_gain_scale: 1.0
12
+ grad_norm: 1.0
13
+ hop_size: 256
14
+ init_checkpoint: ''
15
+ log_interval_steps: 100
16
+ main_loss_type: L1Loss
17
+ model_params:
18
+ ar: true
19
+ encoder_type: taco2
20
+ hidden_dim: 1024
21
+ lstmp_dropout_rate: 0.2
22
+ lstmp_layernorm: false
23
+ lstmp_layers: 2
24
+ lstmp_proj_dim: 256
25
+ prenet_dim: 256
26
+ prenet_dropout_rate: 0.5
27
+ prenet_layers: 2
28
+ model_type: Taco2_AR
29
+ num_mels: 80
30
+ num_save_intermediate_results: 4
31
+ num_workers: 2
32
+ optimizer_params:
33
+ lr: 0.0001
34
+ optimizer_type: AdamW
35
+ outdir: exp/TEM2_ppg_sxliu_taco2_ar
36
+ pin_memory: true
37
+ rank: 0
38
+ resume: ''
39
+ sampling_rate: 24000
40
+ save_interval_steps: 1000
41
+ scheduler: linear_schedule_with_warmup
42
+ scheduler_params:
43
+ num_warmup_steps: 4000
44
+ train_max_steps: 10000
45
+ train_scp: data/TEM2_train/wav.scp
46
+ trg_stats: exp/TEM2_ppg_sxliu_taco2_ar/stats.h5
47
+ trim_frame_size: 2048
48
+ trim_hop_size: 512
49
+ trim_silence: false
50
+ trim_threshold_in_db: 60
51
+ upstream: ppg_sxliu
52
+ verbose: 1
53
+ version: 0.1.5
54
+ vocoder:
55
+ checkpoint: ./downloads/pwg_task1/checkpoint-400000steps.pkl
56
+ config: ./downloads/pwg_task1/config.yml
57
+ stats: ./downloads/pwg_task1/stats.h5
58
+ win_length: null
59
+ window: hann
TEM2/stats.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a971e17114869a18ddadb8c467558e8ad1cc6ffc3c483af2503362241a80449b
3
+ size 4736