lorenlugosch
committed on
Commit
•
876b26c
1
Parent(s):
57434fc
remove more training stuff
Browse files
- hyperparams.yaml +0 -34
hyperparams.yaml
CHANGED
@@ -8,8 +8,6 @@
|
|
8 |
# Authors: Loren Lugosch, Mirco Ravanelli 2020
|
9 |
# ############################################################################
|
10 |
|
11 |
-
token_type: unigram # ["unigram", "bpe", "char"]
|
12 |
-
|
13 |
# Model parameters
|
14 |
sample_rate: 16000
|
15 |
emb_size: 128
|
@@ -75,11 +73,8 @@ model: !new:torch.nn.ModuleList
|
|
75 |
tokenizer: !new:sentencepiece.SentencePieceProcessor
|
76 |
|
77 |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
78 |
-
collect_in: !ref <save_folder>/TAS_tokenizer
|
79 |
loadables:
|
80 |
tokenizer: !ref <tokenizer>
|
81 |
-
paths:
|
82 |
-
tokenizer: !ref <tokenizer_file>
|
83 |
|
84 |
beam_searcher: !new:speechbrain.decoders.S2SRNNBeamSearcher
|
85 |
embedding: !ref <output_emb>
|
@@ -96,36 +91,7 @@ beam_searcher: !new:speechbrain.decoders.S2SRNNBeamSearcher
|
|
96 |
max_attn_shift: 30
|
97 |
coverage_penalty: 0.
|
98 |
|
99 |
-
opt_class: !name:torch.optim.Adam
|
100 |
-
lr: !ref <lr>
|
101 |
-
|
102 |
-
lr_annealing: !new:speechbrain.nnet.schedulers.NewBobScheduler
|
103 |
-
initial_value: !ref <lr>
|
104 |
-
improvement_threshold: 0.0025
|
105 |
-
annealing_factor: 0.8
|
106 |
-
patient: 0
|
107 |
-
|
108 |
-
checkpointer: !new:speechbrain.utils.checkpoints.Checkpointer
|
109 |
-
checkpoints_dir: !ref <save_folder>
|
110 |
-
recoverables:
|
111 |
-
model: !ref <model>
|
112 |
-
scheduler: !ref <lr_annealing>
|
113 |
-
counter: !ref <epoch_counter>
|
114 |
-
|
115 |
-
augmentation: !new:speechbrain.lobes.augment.TimeDomainSpecAugment
|
116 |
-
sample_rate: !ref <sample_rate>
|
117 |
-
speeds: [95, 100, 105]
|
118 |
-
|
119 |
log_softmax: !new:speechbrain.nnet.activations.Softmax
|
120 |
apply_log: True
|
121 |
|
122 |
-
seq_cost: !name:speechbrain.nnet.losses.nll_loss
|
123 |
-
label_smoothing: 0.1
|
124 |
-
|
125 |
-
train_logger: !new:speechbrain.utils.train_logger.FileTrainLogger
|
126 |
-
save_file: !ref <train_log>
|
127 |
-
|
128 |
-
error_rate_computer: !name:speechbrain.utils.metric_stats.ErrorRateStats
|
129 |
|
130 |
-
cer_computer: !name:speechbrain.utils.metric_stats.ErrorRateStats
|
131 |
-
split_tokens: True
|
|
|
8 |
# Authors: Loren Lugosch, Mirco Ravanelli 2020
|
9 |
# ############################################################################
|
10 |
|
|
|
|
|
11 |
# Model parameters
|
12 |
sample_rate: 16000
|
13 |
emb_size: 128
|
|
|
73 |
tokenizer: !new:sentencepiece.SentencePieceProcessor
|
74 |
|
75 |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
|
|
76 |
loadables:
|
77 |
tokenizer: !ref <tokenizer>
|
|
|
|
|
78 |
|
79 |
beam_searcher: !new:speechbrain.decoders.S2SRNNBeamSearcher
|
80 |
embedding: !ref <output_emb>
|
|
|
91 |
max_attn_shift: 30
|
92 |
coverage_penalty: 0.
|
93 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
log_softmax: !new:speechbrain.nnet.activations.Softmax
|
95 |
apply_log: True
|
96 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
97 |
|
|
|
|