|
defaults:
|
|
- common
|
|
|
|
train:
|
|
batch_size: 128
|
|
betas: [0.8, 0.99]
|
|
c_kl: 1.0
|
|
c_mel: 45
|
|
distributed: false
|
|
use_multiprocessing: false
|
|
epochs: 20
|
|
eps: 1e-9
|
|
fp16_run: false
|
|
init_lr_ratio: 1
|
|
raise_error: false
|
|
learning_rate: 2e-4
|
|
log_interval: 10
|
|
log_level: ${log_level}
|
|
lr_decay: 0.98
|
|
max_speclen: 128
|
|
port: 8005
|
|
resume_training: false
|
|
seed: 1234
|
|
segment_size: 8960
|
|
use_sr: false
|
|
valid_epoch_interval: 1
|
|
valid_steps_interval: 1000
|
|
save_epoch_interval: 10
|
|
save_steps_interval: 1000
|
|
warmup_epochs: 0
|
|
|
|
|
|
weighted_batch_speaker_sampling : 0.5
|
|
weighted_batch_lang_sampling : 0.5
|
|
|
|
data:
|
|
dataset_dir: /raid/lucasgris/free-svc/data
|
|
filter_length: 1280
|
|
hop_length: 320
|
|
max_wav_value: 32768.0
|
|
mel_fmax: null
|
|
mel_fmin: 0.0
|
|
n_mel_channels: 80
|
|
num_workers: 64
|
|
|
|
pitch_predictor: rmvpe
|
|
pitch_features_dir: ${data.dataset_dir}/pitch_features/
|
|
sampling_rate: 24000
|
|
spectrogram_dir: null
|
|
|
|
use_spk_emb: true
|
|
spk_embeddings_dir: ${data.dataset_dir}/spk_embeddings
|
|
|
|
sr_min_max: [68, 92]
|
|
|
|
content_feature_dir: null
|
|
training_files: data/train.csv
|
|
validation_files: data/valid.csv
|
|
win_length: 1280
|
|
|
|
model:
|
|
save_dir: null
|
|
filter_channels: 768
|
|
finetune_from_model:
|
|
discriminator: /raid/lucasgris/free-svc/D-freevc-24.pth
|
|
generator: /raid/lucasgris/free-svc/freevc-24.pth
|
|
hidden_channels: 192
|
|
inter_channels: 192
|
|
kernel_size: 3
|
|
n_heads: 2
|
|
n_layers_q: 3
|
|
n_layers: 6
|
|
p_dropout: 0.1
|
|
resblock_dilation_sizes: [[1,3,5], [1,3,5], [1,3,5]]
|
|
resblock_kernel_sizes: [3,7,11]
|
|
resblock: 1
|
|
c_dim: 768
|
|
upsample_initial_channel: 512
|
|
upsample_kernel_sizes: [16,16,4,4]
|
|
upsample_rates: [10,8,2,2]
|
|
use_spectral_norm: false
|
|
freeze_external_spk: true
|
|
device: cuda
|
|
|
|
use_spk_emb: false
|
|
gin_channels: null
|
|
spk_encoder_type: null
|
|
|
|
content_encoder_type: null
|
|
content_encoder_ckpt: null
|
|
post_content_encoder_type: vits-encoder-with-uv-emb
|
|
coarse_f0: true
|
|
cond_f0_on_flow: false
|
|
|