Gluttony10 committed on
Commit
205ca43
1 Parent(s): 138e6cc

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.json +21 -10
  2. config.yml +31 -10
config.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "train": {
3
- "log_interval": 500,
4
- "eval_interval": 500,
5
  "seed": 42,
6
- "epochs": 1000,
7
  "learning_rate": 0.0001,
8
  "betas": [
9
  0.8,
@@ -11,14 +11,19 @@
11
  ],
12
  "eps": 1e-09,
13
  "batch_size": 8,
14
- "fp16_run": false,
15
  "lr_decay": 0.99995,
16
  "segment_size": 16384,
17
  "init_lr_ratio": 1,
18
  "warmup_epochs": 0,
19
  "c_mel": 45,
20
  "c_kl": 1.0,
21
- "skip_optimizer": true
 
 
 
 
 
22
  },
23
  "data": {
24
  "training_files": "Data/glut/filelists/train.list",
@@ -32,14 +37,13 @@
32
  "mel_fmin": 0.0,
33
  "mel_fmax": null,
34
  "add_blank": true,
35
- "n_speakers": 896,
36
  "cleaned_text": true,
37
  "spk2id": {
38
  "16": 0,
39
  "G": 1,
40
  "M": 2,
41
- "S": 3,
42
- "Y": 4
43
  }
44
  },
45
  "model": {
@@ -94,7 +98,14 @@
94
  ],
95
  "n_layers_q": 3,
96
  "use_spectral_norm": false,
97
- "gin_channels": 256
 
 
 
 
 
 
 
98
  },
99
- "version": "2.1"
100
  }
 
1
  {
2
  "train": {
3
+ "log_interval": 1000,
4
+ "eval_interval": 1000,
5
  "seed": 42,
6
+ "epochs": 10000,
7
  "learning_rate": 0.0001,
8
  "betas": [
9
  0.8,
 
11
  ],
12
  "eps": 1e-09,
13
  "batch_size": 8,
14
+ "bf16_run": false,
15
  "lr_decay": 0.99995,
16
  "segment_size": 16384,
17
  "init_lr_ratio": 1,
18
  "warmup_epochs": 0,
19
  "c_mel": 45,
20
  "c_kl": 1.0,
21
+ "c_commit": 100,
22
+ "skip_optimizer": true,
23
+ "freeze_ZH_bert": false,
24
+ "freeze_JP_bert": false,
25
+ "freeze_EN_bert": false,
26
+ "freeze_emo": false
27
  },
28
  "data": {
29
  "training_files": "Data/glut/filelists/train.list",
 
37
  "mel_fmin": 0.0,
38
  "mel_fmax": null,
39
  "add_blank": true,
40
+ "n_speakers": 4,
41
  "cleaned_text": true,
42
  "spk2id": {
43
  "16": 0,
44
  "G": 1,
45
  "M": 2,
46
+ "Y": 3
 
47
  }
48
  },
49
  "model": {
 
98
  ],
99
  "n_layers_q": 3,
100
  "use_spectral_norm": false,
101
+ "gin_channels": 512,
102
+ "slm": {
103
+ "model": "./slm/wavlm-base-plus",
104
+ "sr": 16000,
105
+ "hidden": 768,
106
+ "nlayers": 13,
107
+ "initial_channel": 64
108
+ }
109
  },
110
+ "version": "2.3"
111
  }
config.yml CHANGED
@@ -3,11 +3,12 @@ bert_gen:
3
  device: cuda
4
  num_processes: 2
5
  use_multi_device: false
6
- dataset_path: Data/glut
7
  emo_gen:
8
  config_path: config.json
9
  device: cuda
10
  num_processes: 2
 
11
  mirror: ''
12
  openi_token: ''
13
  preprocess_text:
@@ -18,23 +19,43 @@ preprocess_text:
18
  train_path: filelists/train.list
19
  transcription_path: filelists/short_character_anno.list
20
  val_path: filelists/val.list
21
- val_per_spk: 4
22
  resample:
23
- in_dir: custom_character_voice
24
- out_dir: custom_character_voice
25
  sampling_rate: 44100
26
  server:
27
  device: cuda
28
  models:
29
- - config: Data/glut/config.json
30
  device: cuda
31
  language: ZH
32
- model: Data/glut/models/G_1000.pth
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  speakers: []
34
  port: 5000
35
  train_ms:
36
  base:
37
- model_image: "Bert-VITS2_2.1-Emo\u5E95\u6A21"
38
  repo_id: Stardust_minus/Bert-VITS2
39
  use_base_model: false
40
  config_path: config.json
@@ -46,16 +67,16 @@ train_ms:
46
  WORLD_SIZE: 1
47
  keep_ckpts: 10
48
  model: models
49
- num_workers: 4
50
  spec_cache: true
51
  translate:
52
  app_key: ''
53
  secret_key: ''
54
  webui:
55
- config_path: configs/config.json
56
  debug: false
57
  device: cuda
58
  language_identification_library: langid
59
- model: genshin/models/G_8000.pth
60
  port: 7860
61
  share: false
 
3
  device: cuda
4
  num_processes: 2
5
  use_multi_device: false
6
+ dataset_path: Data\glut
7
  emo_gen:
8
  config_path: config.json
9
  device: cuda
10
  num_processes: 2
11
+ use_multi_device: false
12
  mirror: ''
13
  openi_token: ''
14
  preprocess_text:
 
19
  train_path: filelists/train.list
20
  transcription_path: filelists/short_character_anno.list
21
  val_path: filelists/val.list
22
+ val_per_lang: 4
23
  resample:
24
+ in_dir: raw
25
+ out_dir: wavs
26
  sampling_rate: 44100
27
  server:
28
  device: cuda
29
  models:
30
+ - config: ''
31
  device: cuda
32
  language: ZH
33
+ model: ''
34
+ speakers:
35
+ - length_scale: 1
36
+ noise_scale: 0.6
37
+ noise_scale_w: 0.8
38
+ sdp_ratio: 0.2
39
+ speaker: "\u79D1\u6BD4"
40
+ - length_scale: 0.5
41
+ noise_scale: 0.7
42
+ noise_scale_w: 0.8
43
+ sdp_ratio: 0.3
44
+ speaker: "\u4E94\u6761\u609F"
45
+ - length_scale: 1.2
46
+ noise_scale: 0.6
47
+ noise_scale_w: 0.8
48
+ sdp_ratio: 0.2
49
+ speaker: "\u5B89\u500D\u664B\u4E09"
50
+ - config: ''
51
+ device: cpu
52
+ language: JP
53
+ model: ''
54
  speakers: []
55
  port: 5000
56
  train_ms:
57
  base:
58
+ model_image: "Bert-VITS2_2.3\u5E95\u6A21"
59
  repo_id: Stardust_minus/Bert-VITS2
60
  use_base_model: false
61
  config_path: config.json
 
67
  WORLD_SIZE: 1
68
  keep_ckpts: 10
69
  model: models
70
+ num_workers: 2
71
  spec_cache: true
72
  translate:
73
  app_key: ''
74
  secret_key: ''
75
  webui:
76
+ config_path: config.json
77
  debug: false
78
  device: cuda
79
  language_identification_library: langid
80
+ model: models/G_8000.pth
81
  port: 7860
82
  share: false