{
  "train": {
    "log_interval": 200,
    "eval_interval": 1000,
    "seed": 42,
    "epochs": 10000,
    "learning_rate": 0.0002,
    "betas": [
      0.8,
      0.99
    ],
    "eps": 1e-09,
    "batch_size": 24,
    "fp16_run": false,
    "lr_decay": 0.99995,
    "segment_size": 16384,
    "init_lr_ratio": 1,
    "warmup_epochs": 0,
    "c_mel": 45,
    "c_kl": 1.0,
    "skip_optimizer": true
  },
  "data": {
    "training_files": "filelists/train.list",
    "validation_files": "filelists/val.list",
    "max_wav_value": 32768.0,
    "sampling_rate": 22050,
    "filter_length": 2048,
    "hop_length": 512,
    "win_length": 2048,
    "n_mel_channels": 128,
    "mel_fmin": 0.0,
    "mel_fmax": null,
    "add_blank": true,
    "n_speakers": 700,
    "cleaned_text": true,
    "spk2id": {
      "老克勒": 0,
      "美琳": 1,
      "Jane": 2,
      "小贝": 3,
      "SSB0005": 4,
      "SSB0009": 5,
      "SSB0011": 6,
      "SSB0012": 7,
      "SSB0016": 8,
      "SSB0018": 9,
      "SSB0033": 10,
      "SSB0038": 11,
      "SSB0043": 12,
      "SSB0057": 13,
      "SSB0073": 14,
      "SSB0080": 15,
      "SSB0112": 16,
      "SSB0122": 17,
      "SSB0133": 18,
      "SSB0139": 19,
      "SSB0145": 20,
      "SSB0149": 21,
      "SSB0193": 22,
      "SSB0197": 23,
      "SSB0200": 24,
      "SSB0241": 25,
      "SSB0246": 26,
      "SSB0261": 27,
      "SSB0267": 28,
      "SSB0273": 29,
      "SSB0287": 30,
      "SSB0288": 31,
      "SSB0299": 32,
      "SSB0307": 33,
      "SSB0309": 34,
      "SSB0315": 35,
      "SSB0316": 36,
      "SSB0323": 37,
      "SSB0338": 38,
      "SSB0339": 39,
      "SSB0341": 40,
      "SSB0342": 41,
      "SSB0354": 42,
      "SSB0366": 43,
      "SSB0375": 44,
      "SSB0379": 45,
      "SSB0380": 46,
      "SSB0382": 47,
      "SSB0385": 48,
      "SSB0393": 49,
      "SSB0394": 50,
      "SSB0395": 51,
      "SSB0407": 52,
      "SSB0415": 53,
      "SSB0426": 54,
      "SSB0427": 55,
      "SSB0434": 56,
      "SSB0435": 57,
      "SSB0470": 58,
      "SSB0482": 59,
      "SSB0502": 60,
      "SSB0534": 61,
      "SSB0535": 62,
      "SSB0539": 63,
      "SSB0544": 64,
      "SSB0565": 65,
      "SSB0570": 66,
      "SSB0578": 67,
      "SSB0588": 68,
      "SSB0590": 69,
      "SSB0594": 70,
      "SSB0599": 71,
      "SSB0601": 72,
      "SSB0603": 73,
      "SSB0606": 74,
      "SSB0607": 75,
      "SSB0609": 76,
      "SSB0614": 77,
      "SSB0623": 78,
      "SSB0629": 79,
      "SSB0631": 80,
      "SSB0632": 81,
      "SSB0666": 82,
      "SSB0668": 83,
      "SSB0671": 84,
      "SSB0686": 85,
      "SSB0700": 86,
      "SSB0710": 87,
      "SSB0720": 88,
      "SSB0723": 89,
      "SSB0737": 90,
      "SSB0746": 91,
      "SSB0748": 92,
      "SSB0751": 93,
      "SSB0758": 94,
      "SSB0760": 95,
      "SSB0762": 96,
      "SSB0778": 97,
      "SSB0780": 98,
      "SSB0784": 99,
      "SSB0786": 100,
      "SSB0794": 101,
      "SSB0817": 102,
      "SSB0851": 103,
      "SSB0863": 104,
      "SSB0871": 105,
      "SSB0887": 106,
      "SSB0913": 107,
      "SSB0915": 108,
      "SSB0919": 109,
      "SSB0935": 110,
      "SSB0966": 111,
      "SSB0987": 112,
      "SSB1008": 113,
      "SSB1020": 114,
      "SSB1024": 115,
      "SSB1050": 116,
      "SSB1055": 117,
      "SSB1056": 118,
      "SSB1064": 119,
      "SSB1072": 120,
      "SSB1091": 121,
      "SSB1096": 122,
      "SSB1100": 123,
      "SSB1108": 124,
      "SSB1115": 125,
      "SSB1125": 126,
      "SSB1131": 127,
      "SSB1136": 128,
      "SSB1138": 129,
      "SSB1161": 130,
      "SSB1203": 131,
      "SSB1204": 132,
      "SSB1218": 133,
      "SSB1221": 134,
      "SSB1253": 135,
      "SSB1320": 136,
      "SSB1341": 137,
      "SSB1366": 138,
      "SSB1377": 139,
      "SSB1383": 140,
      "SSB1385": 141,
      "SSB1392": 142,
      "SSB1393": 143,
      "SSB1408": 144,
      "SSB1431": 145,
      "SSB1437": 146,
      "SSB1448": 147,
      "SSB1555": 148,
      "SSB1563": 149,
      "SSB1567": 150,
      "SSB1575": 151,
      "SSB1585": 152,
      "SSB1593": 153,
      "SSB1607": 154,
      "SSB1624": 155,
      "SSB1625": 156,
      "SSB1630": 157,
      "SSB1650": 158,
      "SSB1670": 159,
      "SSB1684": 160,
      "SSB1686": 161,
      "SSB1699": 162,
      "SSB1711": 163,
      "SSB1759": 164,
      "SSB1806": 165,
      "SSB1828": 166,
      "SSB1831": 167,
      "SSB1832": 168,
      "SSB1837": 169,
      "SSB1846": 170,
      "SSB1863": 171,
      "SSB1878": 172,
      "SSB1891": 173,
      "SSB1918": 174,
      "SSB1935": 175,
      "SSB1939": 176,
      "SSB1956": 177,
      "SSB0693": 178,
      "SSB0711": 179,
      "SSB0716": 180,
      "SSB0717": 181,
      "SSB0736": 182,
      "SSB0749": 183,
      "SSB0809": 184,
      "SSB0702": 185,
      "SSB0822": 186,
      "SSB1110": 187,
      "SSB1215": 188,
      "SSB1399": 189,
      "SSB1728": 190,
      "SSB0993": 191,
      "SSB0997": 192,
      "SSB1000": 193,
      "SSB1001": 194,
      "SSB1002": 195,
      "SSB1126": 196,
      "SSB1135": 197,
      "SSB1176": 198,
      "SSB1187": 199,
      "SSB1197": 200,
      "SSB1216": 201,
      "SSB1219": 202,
      "SSB1239": 203,
      "SSB1274": 204,
      "SSB1302": 205,
      "SSB1322": 206,
      "SSB1328": 207,
      "SSB1340": 208,
      "SSB1365": 209,
      "SSB1382": 210,
      "SSB1402": 211,
      "SSB1452": 212,
      "SSB1457": 213,
      "SSB1739": 214,
      "SSB1745": 215,
      "SSB1781": 216,
      "SSB1782": 217,
      "SSB1809": 218,
      "SSB1810": 219,
      "SSB1872": 220,
      "SSB1902": 221,
      "小庄": 222,
      "小嘟": 223
    }
  },
  "model": {
    "use_spk_conditioned_encoder": true,
    "use_noise_scaled_mas": true,
    "use_mel_posterior_encoder": false,
    "use_duration_discriminator": true,
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "1",
    "resblock_kernel_sizes": [
      3,
      7,
      11
    ],
    "resblock_dilation_sizes": [
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ]
    ],
    "upsample_rates": [
      8,
      8,
      2,
      2,
      2
    ],
    "upsample_initial_channel": 512,
    "upsample_kernel_sizes": [
      16,
      16,
      8,
      2,
      2
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 256
  },
  "version": "2.0"
}