File size: 4,349 Bytes
9bd9742
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
{
  "train": {
    "log_interval": 20,
    "eval_interval": 500,
    "seed": 52,
    "epochs": 10000,
    "learning_rate": 1e-04,
    "betas": [
      0.8,
      0.99
    ],
    "eps": 1e-09,
    "batch_size": 1,
    "fp16_run": true,
    "lr_decay": 0.999875,
    "segment_size": 16384,
    "init_lr_ratio": 1,
    "warmup_ratio": 0.1,
    "clipping_grad_norm": 10,
    "c_mel": 45,
    "c_kl": 1.0,
    "skip_optimizer": true
  },
  "data": {
    "training_files": "filelists/train-val-1.list",
    "validation_files": "filelists/val-1.list",
    "max_wav_value": 32768.0,
    "sampling_rate": 44100,
    "filter_length": 2048,
    "hop_length": 512,
    "win_length": 2048,
    "n_mel_channels": 128,
    "mel_fmin": 0.0,
    "mel_fmax": null,
    "add_blank": true,
    "n_speakers": 256,
    "cleaned_text": true,
    "spk2id": {
      "特别周": 0,
      "无声铃鹿": 1,
      "丸善斯基": 2,
      "富士奇迹": 3,
      "东海帝皇": 4,
      "小栗帽": 5,
      "黄金船": 6,
      "伏特加": 7,
      "大和赤骥": 8,
      "菱亚马逊": 9,
      "草上飞": 10,
      "大树快车": 11,
      "目白麦昆": 12,
      "神鹰": 13,
      "鲁道夫象征": 14,
      "好歌剧": 15,
      "成田白仁": 16,
      "爱丽数码": 17,
      "美妙姿势": 18,
      "摩耶重炮": 19,
      "玉藻十字": 20,
      "琵琶晨光": 21,
      "目白赖恩": 22,
      "美浦波旁": 23,
      "雪中美人": 24,
      "米浴": 25,
      "爱丽速子": 26,
      "爱慕织姬": 27,
      "曼城茶座": 28,
      "气槽": 29,
      "星云天空": 30,
      "菱曙": 31,
      "艾尼斯风神": 32,
      "稻荷一": 33,
      "空中神宫": 34,
      "川上公主": 35,
      "黄金城": 36,
      "真机伶": 37,
      "荣进闪耀": 38,
      "采珠": 39,
      "新光风": 40,
      "超级小海湾": 41,
      "荒漠英雄": 42,
      "东瀛佐敦": 43,
      "中山庆典": 44,
      "成田大进": 45,
      "西野花": 46,
      "醒目飞鹰": 47,
      "春乌拉拉": 48,
      "青竹回忆": 49,
      "待兼福来": 50,
      "Mr CB": 51,
      "美丽周日": 52,
      "名将怒涛": 53,
      "帝王光辉": 54,
      "待兼诗歌剧": 55,
      "生野狄杜斯": 56,
      "优秀素质": 57,
      "双涡轮": 58,
      "目白多伯": 59,
      "目白善信": 60,
      "大拓太阳神": 61,
      "北部玄驹": 62,
      "目白阿尔丹": 63,
      "八重无敌": 64,
      "里见光钻": 65,
      "天狼星象征": 66,
      "樱花桂冠": 67,
      "成田路": 68,
      "也文摄辉": 69,
      "吉兆": 70,
      "鹤丸刚志": 71,
      "谷野美酒": 72,
      "第一红宝石": 73,
      "目白高峰": 74,
      "真弓快车": 75,
      "里见皇冠": 76,
      "高尚骏逸": 77,
      "凯斯奇迹": 78,
      "森林宝穴": 79,
      "小林力奇": 80,
      "奇瑞骏": 81,
      "葛城王牌": 82,
      "新宇宙": 83,
      "菱钻奇宝": 84,
      "望族": 85,
      "骏川手纲": 86,
      "秋川弥生": 87,
      "乙名史悦子": 88,
      "桐生院葵": 89,
      "安心泽刺刺美": 90,
      "达利阿拉伯": 91,
      "高多芬柏布": 92,
      "佐岳五月": 93,
      "胜利奖券": 94,
      "樱花进王": 95,
      "东商变革": 96,
      "微光飞驹": 97,
      "樱花千代王": 98,
      "跳舞城": 99,
      "樫本理子": 100,
      "明亮圣辉": 101,
      "拜耶土耳其": 102
    }
  },
  "model": {
    "use_spk_conditioned_encoder": true,
    "use_noise_scaled_mas": true,
    "use_mel_posterior_encoder": false,
    "use_duration_discriminator": true,
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "1",
    "resblock_kernel_sizes": [
      3,
      7,
      11
    ],
    "resblock_dilation_sizes": [
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ]
    ],
    "upsample_rates": [
      8,
      8,
      2,
      2,
      2
    ],
    "upsample_initial_channel": 512,
    "upsample_kernel_sizes": [
      16,
      16,
      8,
      2,
      2
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 256
  }
}