File size: 1,326 Bytes
8c92a11 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 |
{
  // Experiment configuration selecting the "nsfhifigan" generator.
  // This file contains // comments, so it must be read with a
  // comment-tolerant (JSONC/JSON5) parser rather than a strict JSON parser.
  // NOTE(review): settings not listed here are presumably inherited from
  // "base_config" -- confirm against the config loader.
  "base_config": "egs/vocoder/gan/exp_config_base.json",
  "preprocess": {
    // Acoustic features to extract
    "extract_mel": true,
    "extract_audio": true,
    "extract_pitch": true,
    // Features used for model training
    "use_mel": true,
    "use_audio": true,
    "use_frame_pitch": true
  },
  "model": {
    // Names the generator; its settings live under the key of the same name below.
    "generator": "nsfhifigan",
    "nsfhifigan": {
      // Kept as a string on purpose; do not convert to a number without
      // checking how the consumer compares it.
      "resblock": "1",
      "harmonic_num": 8,
      // Product of the rates is 8 * 4 * 2 * 2 * 2 = 256.
      // NOTE(review): presumably this must match the hop size defined in the
      // base config -- confirm.
      "upsample_rates": [
        8,
        4,
        2,
        2,
        2
      ],
      // Same length as "upsample_rates"; each kernel size is twice the rate
      // at the same position.
      "upsample_kernel_sizes": [
        16,
        8,
        4,
        4,
        4
      ],
      "upsample_initial_channel": 768,
      "resblock_kernel_sizes": [
        3,
        7,
        11
      ],
      // Three dilation lists for three kernel sizes.
      // NOTE(review): presumably paired by position with
      // "resblock_kernel_sizes" -- confirm.
      "resblock_dilation_sizes": [
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ]
      ]
    },
    // NOTE(review): "mpd" presumably configures a multi-period discriminator,
    // with "mpd_reshapes" listing its periods -- confirm.
    "mpd": {
      "mpd_reshapes": [
        2,
        3,
        5,
        7,
        11,
        17,
        23,
        37
      ],
      "use_spectral_norm": false,
      "discriminator_channel_multi": 1
    }
  },
  "train": {
    // NOTE(review): presumably the loss terms enabled for training -- confirm.
    "criterions": [
      "feature",
      "discriminator",
      "generator",
      "mel"
    ]
  },
  "inference": {
    "batch_size": 1
  }
}
|