Upload config.yaml
Browse files- config.yaml +50 -0
config.yaml
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
class_path: vocos.experiment.VocosEncodecExp
|
3 |
+
init_args:
|
4 |
+
sample_rate: 24000
|
5 |
+
initial_learning_rate: 5e-4
|
6 |
+
mel_loss_coeff: 45
|
7 |
+
mrd_loss_coeff: 1.0
|
8 |
+
num_warmup_steps: 0 # Optimizer warmup steps
|
9 |
+
pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
|
10 |
+
|
11 |
+
# automatic evaluation
|
12 |
+
evaluate_utmos: true
|
13 |
+
evaluate_pesq: true
|
14 |
+
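evaluate_periodicty: true # NOTE(review): key looks like a misspelling of "periodicity"; confirm the init arg name of the model class before renaming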
|
15 |
+
|
16 |
+
feature_extractor:
|
17 |
+
class_path: vocos.feature_extractors.EncodecFeatures
|
18 |
+
init_args:
|
19 |
+
encodec_model: encodec_24khz
|
20 |
+
bandwidths: [1.5, 3.0, 6.0, 12.0]
|
21 |
+
train_codebooks: false
|
22 |
+
|
23 |
+
backbone:
|
24 |
+
class_path: vocos.models.VocosBackbone
|
25 |
+
init_args:
|
26 |
+
input_channels: 128
|
27 |
+
dim: 384
|
28 |
+
intermediate_dim: 1152
|
29 |
+
num_layers: 8
|
30 |
+
adanorm_num_embeddings: 4 # len(bandwidths) of the feature_extractor above (4 entries)
|
31 |
+
|
32 |
+
head:
|
33 |
+
class_path: vocos.heads.WaveNextHead
|
34 |
+
init_args:
|
35 |
+
dim: 384
|
36 |
+
n_fft: 1280
|
37 |
+
hop_length: 320
|
38 |
+
padding: same
|
39 |
+
|
40 |
+
melspec_loss:
|
41 |
+
class_path: vocos.loss.MelSpecReconstructionLoss
|
42 |
+
init_args:
|
43 |
+
sample_rate: 24000
|
44 |
+
n_fft: 1024
|
45 |
+
hop_length: 256
|
46 |
+
n_mels: 128
|
47 |
+
f_min: 0
|
48 |
+
f_max: 12000
|
49 |
+
clip_val: 1e-7
|
50 |
+
|