GaelleLaperriere committed on
Commit
280ff76
1 Parent(s): 27379fb

Create hyperparams.yaml

Browse files
Files changed (1) hide show
  1. hyperparams.yaml +66 -0
hyperparams.yaml ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ################################
2
+ # Model: wav2vec 2.0 + DNN + CTC + LogSoftmax
3
+ # Authors:
4
+ # Gaelle Laperriere 2023
5
+ # ################################
6
+
7
+ wav2vec_url: LeBenchmark/wav2vec2-FR-3K-large
8
+
9
+ # Feature parameters:
10
+ sample_rate: 16000
11
+ feats_dim: 1024
12
+
13
+ # Model parameters:
14
+ activation: !name:torch.nn.LeakyReLU
15
+ dnn_blocks: 3
16
+ dnn_neurons: 512
17
+
18
+ # Decoding parameters:
19
+ blank_index: 0
20
+
21
+ # Outputs:
22
+ output_neurons: 212
23
+
24
+ # ------ Functions and classes
25
+
26
+ wav2vec2: !new:speechbrain.lobes.models.huggingface_wav2vec.HuggingFaceWav2Vec2
27
+ source: !ref <wav2vec_url>
28
+ output_norm: True
29
+ freeze: True
30
+ save_path: wav2vec2_checkpoint
31
+
32
+ enc: !new:speechbrain.lobes.models.VanillaNN.VanillaNN
33
+ input_shape: [null, null, !ref <feats_dim>]
34
+ activation: !ref <activation>
35
+ dnn_blocks: !ref <dnn_blocks>
36
+ dnn_neurons: !ref <dnn_neurons>
37
+
38
+ output_lin: !new:speechbrain.nnet.linear.Linear
39
+ input_size: !ref <dnn_neurons>
40
+ n_neurons: !ref <output_neurons>
41
+ bias: True
42
+
43
+ log_softmax: !new:speechbrain.nnet.activations.Softmax
44
+ apply_log: True
45
+
46
+ ctc_cost: !name:speechbrain.nnet.losses.ctc_loss
47
+ blank_index: !ref <blank_index>
48
+
49
+ model: !new:torch.nn.ModuleList
50
+ - [!ref <enc>, !ref <output_lin>]
51
+
52
+ encoder: !new:speechbrain.nnet.containers.LengthsCapableSequential  # must be a torch module (not a plain mapping) because it is registered under `modules`; runs wav2vec2 -> enc -> output_lin in order
53
+ wav2vec2: !ref <wav2vec2>
54
+ enc: !ref <enc>
55
+ output_lin: !ref <output_lin>
56
+
57
+ decoding_function: !name:speechbrain.decoders.ctc_greedy_decode
58
+ blank_id: !ref <blank_index>
59
+
60
+ modules:
61
+ encoder: !ref <encoder>
62
+
63
+ pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
64
+ loadables:
65
+ wav2vec2: !ref <wav2vec2>
66
+ model: !ref <model>