{
"train": {
"log_interval": 100,
"eval_interval": 2500,
"seed": 2078,
"epochs": 10000,
"learning_rate": 0.000998,
"betas": [
0.8,
0.99
],
"eps": 1e-09,
"batch_size": 12,
"fp16_run": false,
"lr_decay": 0.999875,
"segment_size": 17920,
"init_lr_ratio": 1,
"warmup_epochs": 0,
"c_mel": 45,
"c_kl": 1.0,
"use_sr": true,
"max_speclen": 384,
"port": "8001"
},
"data": {
"training_files": "filelists/train.txt",
"validation_files": "filelists/val.txt",
"max_wav_value": 32768.0,
"sampling_rate": 32000,
"filter_length": 1280,
"hop_length": 320,
"win_length": 1280,
"n_mel_channels": 80,
"mel_fmin": 0.0,
"mel_fmax": null
},
"model": {
"inter_channels": 192,
"hidden_channels": 192,
"filter_channels": 768,
"n_heads": 2,
"n_layers": 6,
"kernel_size": 3,
"p_dropout": 0.1,
"resblock": "1",
"resblock_kernel_sizes": [
3,
7,
11
],
"resblock_dilation_sizes": [
[
1,
3,
5
],
[
1,
3,
5
],
[
1,
3,
5
]
],
"upsample_rates": [
10,
8,
2,
2
],
"upsample_initial_channel": 512,
"upsample_kernel_sizes": [
16,
16,
4,
4
],
"n_layers_q": 3,
"use_spectral_norm": false,
"gin_channels": 256,
"ssl_dim": 256,
"n_speakers": 64
},
"spk": {
"0":0,
"1":1,
"2":2,
"3":3,
"4":4,
"5":5,
"6":6,
"7":7,
"8":8,
"9":9,
"10":10,
"11":11,
"12":12,
"13":13,
"14":14,
"15":15,
"16":16,
"17":17,
"18":18,
"19":19,
"20":20,
"21":21,
"22":22,
"23":23,
"24":24,
"25":25,
"26":26,
"27":27,
"28":28,
"29":29,
"30":30,
"31":31,
"32":32,
"33":33,
"34":34,
"35":35,
"36":36,
"37":37,
"38":38,
"39":39,
"40":40,
"41":41,
"42":42,
"43":43,
"44":44,
"45":45,
"46":46,
"47":47,
"48":48,
"49":49,
"50":50,
"51":51,
"52":52,
"53":53,
"54":54,
"55":55,
"56":56,
"57":57,
"58":58,
"59":59,
"60":60,
"61":61,
"62":62,
"63":63
}
}