cemsubakan committed on
Commit
25df5de
1 Parent(s): b665af3

Update hyperparams.yaml

Browse files
Files changed (1) hide show
  1. hyperparams.yaml +12 -7
hyperparams.yaml CHANGED
@@ -22,10 +22,10 @@ n_mels: 80
22
  out_n_neurons: 50
23
 
24
  # embedding_model: !new:custom_models.Conv2dEncoder_v2
25
- embedding_model: &id002 !new:speechbrain.lobes.models.PIQ.Conv2dEncoder_v2
26
  dim: 256
27
 
28
- classifier: &id003 !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
29
  input_size: 256
30
  out_neurons: 50
31
  lin_blocks: 1
@@ -38,25 +38,30 @@ n_fft: 1024
38
  spec_mag_power: 0.5
39
  hop_length: 11.6099
40
  win_length: 23.2199
41
- compute_stft: &id005 !new:speechbrain.processing.features.STFT
42
  n_fft: 1024
43
  hop_length: 11.6099
44
  win_length: 23.2199
45
  sample_rate: 16000
46
 
47
- compute_fbank: &id006 !new:speechbrain.processing.features.Filterbank
48
  n_mels: 80
49
  n_fft: 1024
50
  sample_rate: 16000
51
 
52
- compute_istft: &id007 !new:speechbrain.processing.features.ISTFT
53
  sample_rate: 16000
54
  hop_length: 11.6099
55
  win_length: 23.2199
56
 
57
  label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
58
- psi_model: *id004
59
-
 
 
 
 
 
60
 
61
  modules:
62
  compute_stft: !ref <compute_stft>
 
22
  out_n_neurons: 50
23
 
24
  # embedding_model: !new:custom_models.Conv2dEncoder_v2
25
+ embedding_model: !new:speechbrain.lobes.models.PIQ.Conv2dEncoder_v2
26
  dim: 256
27
 
28
+ classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
29
  input_size: 256
30
  out_neurons: 50
31
  lin_blocks: 1
 
38
  spec_mag_power: 0.5
39
  hop_length: 11.6099
40
  win_length: 23.2199
41
+ compute_stft: !new:speechbrain.processing.features.STFT
42
  n_fft: 1024
43
  hop_length: 11.6099
44
  win_length: 23.2199
45
  sample_rate: 16000
46
 
47
+ compute_fbank: !new:speechbrain.processing.features.Filterbank
48
  n_mels: 80
49
  n_fft: 1024
50
  sample_rate: 16000
51
 
52
+ compute_istft: !new:speechbrain.processing.features.ISTFT
53
  sample_rate: 16000
54
  hop_length: 11.6099
55
  win_length: 23.2199
56
 
57
  label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
58
+ psi_model: !new:speechbrain.lobes.models.PIQ.VectorQuantizedPSI_Audio
59
+ dim: 256
60
+ K: 1024
61
+ shared_keys: 0
62
+ activate_class_partitioning: true
63
+ use_adapter: true
64
+ adapter_reduce_dim: true
65
 
66
  modules:
67
  compute_stft: !ref <compute_stft>