Upload config.json with huggingface_hub
Browse files- config.json +7 -32
config.json
CHANGED
@@ -27,8 +27,8 @@
|
|
27 |
"batch_size": 8,
|
28 |
"eval_batch_size": 4,
|
29 |
"grad_clip": [
|
30 |
-
1000,
|
31 |
-
1000
|
32 |
],
|
33 |
"scheduler_after_epoch": true,
|
34 |
"lr": 0.001,
|
@@ -54,37 +54,12 @@
|
|
54 |
"use_noise_augment": false,
|
55 |
"audio": {
|
56 |
"fft_size": 1024,
|
|
|
57 |
"win_length": 1024,
|
58 |
"hop_length": 256,
|
59 |
-
"frame_shift_ms": null,
|
60 |
-
"frame_length_ms": null,
|
61 |
-
"stft_pad_mode": "reflect",
|
62 |
-
"sample_rate": 22050,
|
63 |
-
"resample": false,
|
64 |
-
"preemphasis": 0.0,
|
65 |
-
"ref_level_db": 20,
|
66 |
-
"do_sound_norm": false,
|
67 |
-
"log_func": "np.log10",
|
68 |
-
"do_trim_silence": false,
|
69 |
-
"trim_db": 45,
|
70 |
-
"do_rms_norm": false,
|
71 |
-
"db_level": null,
|
72 |
-
"power": 1.5,
|
73 |
-
"griffin_lim_iters": 60,
|
74 |
"num_mels": 80,
|
75 |
"mel_fmin": 0,
|
76 |
-
"mel_fmax": null,
|
77 |
-
"spec_gain": 20,
|
78 |
-
"do_amp_to_db_linear": true,
|
79 |
-
"do_amp_to_db_mel": true,
|
80 |
-
"pitch_fmax": 640.0,
|
81 |
-
"pitch_fmin": 1.0,
|
82 |
-
"signal_norm": true,
|
83 |
-
"min_level_db": -100,
|
84 |
-
"symmetric_norm": true,
|
85 |
-
"max_norm": 4.0,
|
86 |
-
"clip_norm": true,
|
87 |
-
"stats_path": null
|
88 |
},
|
89 |
"use_phonemes": true,
|
90 |
"phonemizer": "espeak",
|
@@ -244,7 +219,7 @@
|
|
244 |
"use_sdp": true,
|
245 |
"noise_scale": 1.0,
|
246 |
"inference_noise_scale": 0.667,
|
247 |
-
"length_scale": 1,
|
248 |
"noise_scale_dp": 1.0,
|
249 |
"inference_noise_scale_dp": 1.0,
|
250 |
"max_inference_len": null,
|
@@ -252,7 +227,7 @@
|
|
252 |
"use_spectral_norm_disriminator": false,
|
253 |
"use_speaker_embedding": false,
|
254 |
"num_speakers": 0,
|
255 |
-
"speakers_file": "
|
256 |
"d_vector_file": null,
|
257 |
"speaker_embedding_channels": 256,
|
258 |
"use_d_vector_file": false,
|
@@ -302,7 +277,7 @@
|
|
302 |
"r": 1,
|
303 |
"num_speakers": 3,
|
304 |
"use_speaker_embedding": false,
|
305 |
-
"speakers_file": "
|
306 |
"speaker_embedding_channels": 256,
|
307 |
"language_ids_file": null,
|
308 |
"use_language_embedding": false,
|
|
|
27 |
"batch_size": 8,
|
28 |
"eval_batch_size": 4,
|
29 |
"grad_clip": [
|
30 |
+
1000.0,
|
31 |
+
1000.0
|
32 |
],
|
33 |
"scheduler_after_epoch": true,
|
34 |
"lr": 0.001,
|
|
|
54 |
"use_noise_augment": false,
|
55 |
"audio": {
|
56 |
"fft_size": 1024,
|
57 |
+
"sample_rate": 22050,
|
58 |
"win_length": 1024,
|
59 |
"hop_length": 256,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
60 |
"num_mels": 80,
|
61 |
"mel_fmin": 0,
|
62 |
+
"mel_fmax": null
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
63 |
},
|
64 |
"use_phonemes": true,
|
65 |
"phonemizer": "espeak",
|
|
|
219 |
"use_sdp": true,
|
220 |
"noise_scale": 1.0,
|
221 |
"inference_noise_scale": 0.667,
|
222 |
+
"length_scale": 1.0,
|
223 |
"noise_scale_dp": 1.0,
|
224 |
"inference_noise_scale_dp": 1.0,
|
225 |
"max_inference_len": null,
|
|
|
227 |
"use_spectral_norm_disriminator": false,
|
228 |
"use_speaker_embedding": false,
|
229 |
"num_speakers": 0,
|
230 |
+
"speakers_file": "train_output/kagg/speakers.pth",
|
231 |
"d_vector_file": null,
|
232 |
"speaker_embedding_channels": 256,
|
233 |
"use_d_vector_file": false,
|
|
|
277 |
"r": 1,
|
278 |
"num_speakers": 3,
|
279 |
"use_speaker_embedding": false,
|
280 |
+
"speakers_file": "train_output/kagg/speakers.pth",
|
281 |
"speaker_embedding_channels": 256,
|
282 |
"language_ids_file": null,
|
283 |
"use_language_embedding": false,
|