---
# Hyperparameter mapping for an SVC training run.
# Top-level keys are kept in their original (alphabetical) order.
# Two entries hold nested mappings: binarization_args and pre_align_args.
K_step: 1000
accumulate_grad_batches: 1
audio_num_mel_bins: 128
audio_sample_rate: 44100
binarization_args:
  shuffle: false
  with_align: true
  with_f0: true
  with_hubert: true
  with_spk_embed: false
  with_wav: false
binarizer_cls: preprocessing.SVCpre.SVCBinarizer
binary_data_dir: data/binary/aquapre
check_val_every_n_epoch: 10
choose_test_manually: false
clip_grad_norm: 1
# NOTE(review): absolute, machine-specific Windows path. Single-quoted so the
# backslashes and the drive-letter colon stay literal.
config_path: 'F:\diff-svc-main\training\config_nsf.yaml'
content_cond_steps: []
cwt_add_f0_loss: false
cwt_hidden_size: 128
cwt_layers: 2
cwt_loss: l1
cwt_std_scale: 0.8
datasets:
  - opencpop
debug: false
dec_ffn_kernel_size: 9
dec_layers: 4
decay_steps: 20000
decoder_type: fft
dict_dir: ''
diff_decoder_type: wavenet
diff_loss_type: l2
dilation_cycle_length: 4
dropout: 0.1
ds_workers: 4
# Each entry is a comma-separated string, not a list; quoted to make the
# string type explicit.
dur_enc_hidden_stride_kernel:
  - '0,2,3'
  - '0,2,3'
  - '0,1,3'
dur_loss: mse
dur_predictor_kernel: 3
dur_predictor_layers: 5
enc_ffn_kernel_size: 9
enc_layers: 4
encoder_K: 8
encoder_type: fft
endless_ds: false
f0_bin: 256
f0_max: 1100.0
f0_min: 40.0
# JSON document stored as a single string value (keys "28.0".."85.0" plus
# "total_time"); the consumer has to decode it itself.
f0_static: '{"28.0": 0.07, "29.0": 0.03, "31.0": 0.05, "32.0": 0.08, "33.0": 0.12, "34.0": 0.02, "35.0": 0.06, "36.0": 0.02, "37.0": 0.01, "38.0": 0.1, "39.0": 0.05, "40.0": 0.09, "41.0": 0.14, "42.0": 0.16, "43.0": 0.03, "44.0": 0.42, "45.0": 0.74, "46.0": 1.13, "47.0": 1.49, "48.0": 1.76, "49.0": 2.59, "50.0": 3.03, "51.0": 2.71, "52.0": 1.93, "53.0": 1.11, "54.0": 0.78, "55.0": 3.33, "56.0": 20.38, "57.0": 69.6, "58.0": 167.04, "59.0": 245.1, "60.0": 318.87, "61.0": 373.41, "62.0": 434.86, "63.0": 415.63, "64.0": 448.97, "65.0": 452.99, "66.0": 474.88, "67.0": 471.54, "68.0": 455.78, "69.0": 421.71, "70.0": 372.06, "71.0": 323.85, "72.0": 292.8, "73.0": 238.94, "74.0": 190.5, "75.0": 132.86, "76.0": 88.03, "77.0": 53.16, "78.0": 32.96, "79.0": 23.66, "80.0": 14.74, "81.0": 8.54, "82.0": 5.0, "83.0": 3.32, "84.0": 2.29, "85.0": 0.91, "total_time": 6576.43}'
ffn_act: gelu
ffn_padding: SAME
fft_size: 2048
fmax: 16000
fmin: 40
fs2_ckpt: ''
gaussian_start: true
gen_dir_name: ''
gen_tgt_spk_id: -1
hidden_size: 256
hop_size: 512
hubert_gpu: true
hubert_path: checkpoints/hubert/hubert_soft.pt
infer: false
keep_bins: 128
lambda_commit: 0.25
lambda_energy: 0.0
lambda_f0: 1.0
lambda_ph_dur: 0.3
lambda_sent_dur: 1.0
lambda_uv: 1.0
lambda_word_dur: 1.0
load_ckpt: ''
log_interval: 100
loud_norm: false
lr: 0.0008
max_beta: 0.02
max_epochs: 3000
max_eval_sentences: 1
max_eval_tokens: 60000
max_frames: 42000
max_input_tokens: 6000
max_sentences: 88
max_tokens: 128000
max_updates: 1000000
# Quoted because the value contains ':' and '|' indicator characters.
mel_loss: 'ssim:0.5|l1:0.5'
mel_vmax: 1.5
mel_vmin: -6.0
min_level_db: -120
no_fs2: true
norm_type: gn
num_ckpt_keep: 10
num_heads: 2
num_sanity_val_steps: 1
num_spk: 1
num_test_samples: 0
num_valid_plots: 10
optimizer_adam_beta1: 0.9
optimizer_adam_beta2: 0.98
out_wav_norm: false
pe_ckpt: checkpoints/0102_xiaoma_pe/model_ckpt_steps_60000.ckpt
pe_enable: false
perform_enhance: true
pitch_ar: false
# Each entry is a comma-separated string, not a list.
pitch_enc_hidden_stride_kernel:
  - '0,2,5'
  - '0,2,5'
  - '0,2,5'
pitch_extractor: parselmouth
pitch_loss: l2
pitch_norm: log
pitch_type: frame
pndm_speedup: 10
pre_align_args:
  allow_no_txt: false
  denoise: false
  forced_align: mfa
  txt_processor: zh_g2pM
  use_sox: true
  use_tone: false
pre_align_cls: data_gen.singing.pre_align.SingingPreAlign
predictor_dropout: 0.5
predictor_grad: 0.1
predictor_hidden: -1
predictor_kernel: 5
predictor_layers: 5
prenet_dropout: 0.5
prenet_hidden_size: 256
pretrain_fs_ckpt: ''
# NOTE(review): 'xxx' looks like a placeholder - confirm whether it is read.
processed_data_dir: xxx
profile_infer: false
raw_data_dir: data/raw/aquapre
ref_norm_layer: bn
rel_pos: true
reset_phone_dict: true
residual_channels: 512
residual_layers: 20
save_best: false
save_ckpt: true
save_codes:
  - configs
  - modules
  - src
  - utils
save_f0: true
save_gt: false
schedule_type: linear
seed: 1234
sort_by_len: true
speaker_id: aqua
# 128 entries, the same number as audio_num_mel_bins / keep_bins above.
spec_max:
  - 0.18377557396888733
  - -0.33469653129577637
  - -0.3073468506336212
  - -0.21027648448944092
  - 0.23178215324878693
  - 0.5297451019287109
  - 0.7021887898445129
  - 0.7711099982261658
  - 0.7912386059761047
  - 0.6609739065170288
  - 0.649876058101654
  - 0.6327046751976013
  - 0.6892049908638
  - 0.6026111841201782
  - 0.6834777593612671
  - 0.7417489886283875
  - 0.6040375828742981
  - 0.5854794383049011
  - 0.7123280167579651
  - 0.5886657238006592
  - 0.6135984063148499
  - 0.5388530492782593
  - 0.5932422280311584
  - 0.535581111907959
  - 0.57913738489151
  - 0.6827316880226135
  - 0.6265526413917542
  - 0.6557696461677551
  - 0.6586976647377014
  - 0.5687282085418701
  - 0.6218562722206116
  - 0.6349128484725952
  - 0.6176865100860596
  - 0.6212958097457886
  - 0.6277656555175781
  - 0.5551338195800781
  - 0.6126622557640076
  - 0.5821346640586853
  - 0.577056348323822
  - 0.5649800300598145
  - 0.5984634757041931
  - 0.4873456656932831
  - 0.47209471464157104
  - 0.4387756586074829
  - 0.4690910577774048
  - 0.4616055190563202
  - 0.3555675446987152
  - 0.3898852467536926
  - 0.3676068186759949
  - 0.4632047414779663
  - 0.37983986735343933
  - 0.3877682685852051
  - 0.3099276125431061
  - 0.3261813223361969
  - 0.34168118238449097
  - 0.3004901111125946
  - 0.3512653112411499
  - 0.2647061347961426
  - 0.2685043215751648
  - 0.20390087366104126
  - 0.1825377196073532
  - 0.22067485749721527
  - 0.20306138694286346
  - 0.12710601091384888
  - 0.10927848517894745
  - 0.1117628887295723
  - 0.14148156344890594
  - 0.122605100274086
  - 0.08032718300819397
  - 0.12159623205661774
  - -0.04923255369067192
  - -0.07824847847223282
  - 0.03441360592842102
  - 0.07093964517116547
  - -0.1269683688879013
  - 0.0027632638812065125
  - -0.045093610882759094
  - -0.04115259647369385
  - 0.029067598283290863
  - -0.009453626349568367
  - -0.0470033697783947
  - -0.04894810542464256
  - -0.06236470118165016
  - -0.20086997747421265
  - -0.2363593578338623
  - -0.17289961874485016
  - -0.219277486205101
  - -0.2934815585613251
  - -0.30551621317863464
  - -0.2513120770454407
  - -0.26792851090431213
  - -0.33068278431892395
  - -0.37532031536102295
  - -0.365634560585022
  - -0.3379015326499939
  - -0.26979681849479675
  - -0.20316314697265625
  - -0.2109878957271576
  - -0.16927000880241394
  - -0.1698305308818817
  - -0.2739156186580658
  - -0.2700604200363159
  - -0.32284122705459595
  - -0.44529229402542114
  - -0.4002469480037689
  - -0.2441970407962799
  - -0.19795942306518555
  - -0.2462945580482483
  - -0.0673084482550621
  - -0.22117790579795837
  - -0.21418607234954834
  - -0.39467209577560425
  - -0.4388139843940735
  - -0.3227368891239166
  - -0.30530503392219543
  - -0.3201104998588562
  - -0.39839836955070496
  - -0.464596688747406
  - -0.5399728417396545
  - -0.5515261292457581
  - -0.520453691482544
  - -0.6714966893196106
  - -0.6414765119552612
  - -0.6108742356300354
  - -0.6762520670890808
  - -0.7067146301269531
  - -0.7586700320243835
  - -0.6640384793281555
# Every entry is -4.999994277954102 except the second-to-last one.
spec_min:
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.999994277954102
  - -4.989471912384033
  - -4.999994277954102
spk_cond_steps: []
stop_token_weight: 5.0
task_cls: training.task.SVC_task.SVCTask
test_ids: []
test_input_dir: ''
test_num: 0
test_prefixes:
  - test
test_set_name: test
timesteps: 1000
train_set_name: train
use_cn_hubert: false
use_crepe: true
use_denoise: false
use_energy_embed: false
use_gt_dur: false
use_gt_f0: false
use_midi: false
use_nsf: true
use_pitch_embed: true
use_pos_embed: true
use_spk_embed: false
use_spk_id: false
use_split_spk_id: false
use_uv: false
use_var_enc: false
use_vec: false
val_check_interval: 2000
valid_num: 0
valid_set_name: valid
vocoder: network.vocoders.nsf_hifigan.NsfHifiGAN
vocoder_ckpt: checkpoints/nsf_hifigan/model
warmup_updates: 2000
# NOTE(review): '1e-6' has no decimal point, so YAML 1.1 loaders (e.g. PyYAML)
# read it as the string "1e-6" while YAML 1.2 loaders read a float. Value left
# unchanged; confirm the consumer converts it, or write 1.0e-6 if a float is
# intended.
wav2spec_eps: 1e-6
weight_decay: 0
win_size: 2048
work_dir: checkpoints/aquapre