Spaces:
Running
on
T4
Running
on
T4
File size: 1,722 Bytes
b725c5a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 |
{
"base_config": "config/base.json",
"dataset": [
"LJSpeech",
"LibriTTS",
"opencpop",
"m4singer",
"svcc",
"svcceval",
"pjs",
"opensinger",
"popbutfy",
"nus48e",
"popcs",
"kising",
"csd",
"opera",
"vctk",
"lijian",
"cdmusiceval"
],
"task_type": "vocoder",
"preprocess": {
// acoustic features
"extract_mel": true,
"extract_pitch": false,
"extract_uv": false,
"extract_audio": true,
"extract_label": false,
"extract_one_hot": false,
"extract_amplitude_phase": false,
"pitch_extractor": "parselmouth",
// Settings for data preprocessing
"n_mel": 100,
"win_size": 1024,
"hop_size": 256,
"sample_rate": 24000,
"n_fft": 1024,
"fmin": 0,
"fmax": 12000,
"f0_min": 50,
"f0_max": 1100,
"pitch_bin": 256,
"pitch_max": 1100.0,
"pitch_min": 50.0,
"is_mu_law": false,
"bits": 8,
"cut_mel_frame": 32,
// Directory names of processed data or extracted features
"spk2id": "singers.json",
// Features used for model training
"use_mel": true,
"use_frame_pitch": false,
"use_uv": false,
"use_audio": true,
"use_label": false,
"use_one_hot": false,
"train_file": "train.json",
"valid_file": "test.json"
},
"train": {
"random_seed": 114514,
"batch_size": 64,
"gradient_accumulation_step": 1,
"max_epoch": 1000000,
"save_checkpoint_stride": [
20
],
"run_eval": [
true
],
"sampler": {
"holistic_shuffle": true,
"drop_last": true
},
"dataloader": {
"num_worker": 4,
"pin_memory": true
},
"tracker": [
"tensorboard"
],
}
} |