speechbrain
/

metricgan-plus-voicebank

speech-enhancement

Model card Files Files and versions Community

metricgan-plus-voicebank / hyperparams.yaml

pplantinga's picture

Add PESQ 3.15 model

85b2091 over 3 years ago

history blame contribute delete

1.12 kB

	# STFT parameters
	# Shared analysis/synthesis settings. Each value below is pulled in via
	# `!ref <name>` by both `compute_stft` and `compute_istft`, so the forward
	# and inverse transforms always use the same configuration.
	# Audio sampling rate (16000 -> presumably Hz; confirm against the STFT class).
	sample_rate: 16000
	# NOTE(review): win_length / hop_length look like milliseconds rather than
	# samples (32 and 16 are smaller than n_fft = 512) - confirm against the
	# speechbrain.processing.features.STFT documentation.
	win_length: 32
	hop_length: 16
	# FFT size; also determines the enhancement model input size
	# (`<n_fft> // 2 + 1` in `enhance_model`).
	n_fft: 512
	# `!name:` passes the window function itself (not a computed window tensor).
	window_fn: !name:torch.hamming_window

	# Forward STFT. `!new:` instantiates the class with the nested mapping as
	# keyword arguments, so the arguments must be indented under this key;
	# left at the top level they would instead redefine the shared
	# `sample_rate`, `n_fft`, ... keys as references to themselves.
	compute_stft: !new:speechbrain.processing.features.STFT
	    sample_rate: !ref <sample_rate>
	    n_fft: !ref <n_fft>
	    win_length: !ref <win_length>
	    hop_length: !ref <hop_length>
	    window_fn: !ref <window_fn>

	# Inverse STFT, configured from the same shared parameters as
	# `compute_stft` so that resynthesis matches the analysis transform.
	# The keyword arguments must be nested under the `!new:` node; at the top
	# level they would be duplicate, self-referencing keys.
	compute_istft: !new:speechbrain.processing.features.ISTFT
	    sample_rate: !ref <sample_rate>
	    n_fft: !ref <n_fft>
	    win_length: !ref <win_length>
	    hop_length: !ref <hop_length>
	    window_fn: !ref <window_fn>

	# `!name:` binds the nested keyword arguments to the function without
	# calling it, so `power` must be indented under this key to be bound.
	# Per the SpeechBrain docs, power: 0.5 selects the magnitude spectrogram
	# (power: 1 would give the power spectrogram).
	spectral_magnitude: !name:speechbrain.processing.features.spectral_magnitude
	    power: 0.5

	# Resynthesis function with the STFT/ISTFT objects defined in this file
	# pre-bound as keyword arguments (`!name:` binds, it does not call).
	# `stft` / `istft` must be nested here to be bound to the function.
	resynth: !name:speechbrain.processing.signal_processing.resynthesize
	    stft: !ref <compute_stft>
	    istft: !ref <compute_istft>

	# MetricGAN enhancement generator. The constructor arguments are nested
	# under the `!new:` node so they are passed as keyword arguments.
	enhance_model: !new:speechbrain.lobes.models.MetricGAN.EnhancementGenerator
	    # Arithmetic on a reference: evaluates to 257 for n_fft = 512
	    # (presumably the number of one-sided frequency bins - confirm).
	    input_size: !ref <n_fft> // 2 + 1
	    hidden_size: 200
	    num_layers: 2
	    dropout: 0

	# Mapping of module name -> instantiated module. The entry must be nested:
	# at the top level, `enhance_model: !ref <enhance_model>` would leave
	# `modules` empty and overwrite the model definition with a reference to
	# itself.
	modules:
	    enhance_model: !ref <enhance_model>

	# Pretrainer that loads saved parameters into the objects listed under
	# `loadables` (name -> object). `loadables` is a constructor argument and
	# `enhance_model` is an entry inside it, so two levels of nesting are
	# required.
	pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
	    loadables:
	        enhance_model: !ref <enhance_model>