Kamtera committed on
Commit
f3abfc1
1 Parent(s): a7ae07b

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +7 -32
config.json CHANGED
@@ -27,8 +27,8 @@
27
  "batch_size": 8,
28
  "eval_batch_size": 4,
29
  "grad_clip": [
30
- 1000,
31
- 1000
32
  ],
33
  "scheduler_after_epoch": true,
34
  "lr": 0.001,
@@ -54,37 +54,12 @@
54
  "use_noise_augment": false,
55
  "audio": {
56
  "fft_size": 1024,
 
57
  "win_length": 1024,
58
  "hop_length": 256,
59
- "frame_shift_ms": null,
60
- "frame_length_ms": null,
61
- "stft_pad_mode": "reflect",
62
- "sample_rate": 22050,
63
- "resample": false,
64
- "preemphasis": 0.0,
65
- "ref_level_db": 20,
66
- "do_sound_norm": false,
67
- "log_func": "np.log10",
68
- "do_trim_silence": false,
69
- "trim_db": 45,
70
- "do_rms_norm": false,
71
- "db_level": null,
72
- "power": 1.5,
73
- "griffin_lim_iters": 60,
74
  "num_mels": 80,
75
  "mel_fmin": 0,
76
- "mel_fmax": null,
77
- "spec_gain": 20,
78
- "do_amp_to_db_linear": true,
79
- "do_amp_to_db_mel": true,
80
- "pitch_fmax": 640.0,
81
- "pitch_fmin": 1.0,
82
- "signal_norm": true,
83
- "min_level_db": -100,
84
- "symmetric_norm": true,
85
- "max_norm": 4.0,
86
- "clip_norm": true,
87
- "stats_path": null
88
  },
89
  "use_phonemes": true,
90
  "phonemizer": "espeak",
@@ -244,7 +219,7 @@
244
  "use_sdp": true,
245
  "noise_scale": 1.0,
246
  "inference_noise_scale": 0.667,
247
- "length_scale": 1,
248
  "noise_scale_dp": 1.0,
249
  "inference_noise_scale_dp": 1.0,
250
  "max_inference_len": null,
@@ -252,7 +227,7 @@
252
  "use_spectral_norm_disriminator": false,
253
  "use_speaker_embedding": false,
254
  "num_speakers": 0,
255
- "speakers_file": "/kaggle/working/train_output/kagg/speakers.pth",
256
  "d_vector_file": null,
257
  "speaker_embedding_channels": 256,
258
  "use_d_vector_file": false,
@@ -302,7 +277,7 @@
302
  "r": 1,
303
  "num_speakers": 3,
304
  "use_speaker_embedding": false,
305
- "speakers_file": "/kaggle/working/train_output/kagg/speakers.pth",
306
  "speaker_embedding_channels": 256,
307
  "language_ids_file": null,
308
  "use_language_embedding": false,
 
27
  "batch_size": 8,
28
  "eval_batch_size": 4,
29
  "grad_clip": [
30
+ 1000.0,
31
+ 1000.0
32
  ],
33
  "scheduler_after_epoch": true,
34
  "lr": 0.001,
 
54
  "use_noise_augment": false,
55
  "audio": {
56
  "fft_size": 1024,
57
+ "sample_rate": 22050,
58
  "win_length": 1024,
59
  "hop_length": 256,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
60
  "num_mels": 80,
61
  "mel_fmin": 0,
62
+ "mel_fmax": null
 
 
 
 
 
 
 
 
 
 
 
63
  },
64
  "use_phonemes": true,
65
  "phonemizer": "espeak",
 
219
  "use_sdp": true,
220
  "noise_scale": 1.0,
221
  "inference_noise_scale": 0.667,
222
+ "length_scale": 1.0,
223
  "noise_scale_dp": 1.0,
224
  "inference_noise_scale_dp": 1.0,
225
  "max_inference_len": null,
 
227
  "use_spectral_norm_disriminator": false,
228
  "use_speaker_embedding": false,
229
  "num_speakers": 0,
230
+ "speakers_file": "train_output/kagg/speakers.pth",
231
  "d_vector_file": null,
232
  "speaker_embedding_channels": 256,
233
  "use_d_vector_file": false,
 
277
  "r": 1,
278
  "num_speakers": 3,
279
  "use_speaker_embedding": false,
280
+ "speakers_file": "train_output/kagg/speakers.pth",
281
  "speaker_embedding_channels": 256,
282
  "language_ids_file": null,
283
  "use_language_embedding": false,