# Hyperparameters for the SpeechBrain EnhanceResnet enhancement model.

# STFT arguments.
# Each of these four values is forwarded to `enhance_model` further down via
# `!ref`, so they are defined once here and must be edited here.
# NOTE(review): win_length and hop_length look like durations in milliseconds
# rather than sample counts (32 ms at 16 kHz is 512 samples, which matches
# n_fft) — confirm against the EnhanceResnet signature before changing one
# of them independently of the others.
sample_rate: 16000
n_fft: 512
win_length: 32
hop_length: 16

# Forwarded to the `mask_weight` argument of `enhance_model` via `!ref`.
# NOTE(review): presumably the weight given to the predicted mask
# (0 = no masking, 1 = full masking) — confirm against EnhanceResnet docs.
mask_weight: 0.99

# Enhancement model args.
# `!new:` constructs an EnhanceResnet object when this file is loaded, using
# the nested keys as keyword arguments. The STFT settings and mask_weight are
# not repeated here: they are pulled from the top-level keys through `!ref`.
enhance_model: !new:speechbrain.lobes.models.EnhanceResnet.EnhanceResnet
    n_fft: !ref <n_fft>
    win_length: !ref <win_length>
    hop_length: !ref <hop_length>
    sample_rate: !ref <sample_rate>
    # Six entries, in three equal-valued pairs.
    # NOTE(review): presumably one entry per convolutional block — confirm.
    channel_counts: [128, 128, 256, 256, 512, 512]
    # `!name:` passes BatchNorm2d as a callable instead of constructing it
    # here, so the model decides when and with what arguments to build it.
    normalization: !name:speechbrain.nnet.normalization.BatchNorm2d
    # `!new:` with no nested keys: a GELU instance built with no arguments.
    activation: !new:torch.nn.GELU
    dense_count: 2
    dense_nodes: 1024
    dropout: 0.1
    mask_weight: !ref <mask_weight>

# Mapping of module names to objects. The single entry references the
# top-level `enhance_model` key instead of declaring a second model.
modules:
    enhance_model: !ref <enhance_model>

# Pretrainer constructed with one loadable, `enhance_model`, which references
# the same top-level key that `modules` uses.
# NOTE(review): no checkpoint path or source is configured in this file —
# presumably the caller supplies it at load time; confirm.
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
    loadables:
        enhance_model: !ref <enhance_model>