speechbrain/whisper_rescuespeech

Automatic Speech Recognition

hf-asr-leaderboard

Model card Files Files and versions Community

sangeet2020 committed on Jul 1, 2023

Commit

c9a2d6d

•

1 Parent(s): b3e6c6f

formatting

Files changed (2) hide show

config.json +1 -2
hyperparams.yaml +33 -26

config.json CHANGED Viewed

@@ -1,4 +1,3 @@
 {
     "speechbrain_interface": "WhisperASR"
-}

 {
     "speechbrain_interface": "WhisperASR"
+}

hyperparams.yaml CHANGED Viewed

@@ -17,7 +17,7 @@ language: german
 normalized_transcripts: true
 test_only: false # Set it to True if you only want to  do the evaluation
-auto_mix_prec: false
 sample_rate: 16000
 # These values are only used for the searchers.
@@ -31,38 +31,45 @@ bos_index: 50258
 # Decoding parameters
 min_decode_ratio: 0.0
-max_decode_ratio: 1.0
 test_beam_size: 8
 # Model parameters
-freeze_whisper: false
-freeze_encoder_only: false
-freeze_encoder: true
-#
-# Functions and classes
-#
-whisper: &id001 !new:speechbrain.lobes.models.huggingface_whisper.HuggingFaceWhisper
-  source: openai/whisper-large-v2
-  freeze: false
-  save_path: openai/whisper-large-v2
-  encoder_only: false
-  freeze_encoder: true
-modules:
-  whisper: *id001
-whisper_opt_class: !name:torch.optim.AdamW
-  lr: 0.00003
-  weight_decay: 0.01
 decoder: !new:speechbrain.decoders.seq2seq.S2SWhisperGreedySearch
-  model: *id001
-  bos_index: 50363
-  eos_index: 50257
-  min_decode_ratio: 0.0
-  max_decode_ratio: 1.0
-pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
-  loadables:
     whisper: !ref <whisper>

 normalized_transcripts: true
 test_only: false # Set it to True if you only want to  do the evaluation
+auto_mix_prec: False
 sample_rate: 16000
 # These values are only used for the searchers.
 # Decoding parameters
 min_decode_ratio: 0.0
+max_decode_ratio: 0.1
 test_beam_size: 8
 # Model parameters
+freeze_whisper: True
+freeze_encoder: True
+whisper: !new:speechbrain.lobes.models.huggingface_whisper.HuggingFaceWhisper
+    source: !ref <whisper_hub>
+    freeze: !ref <freeze_whisper>
+    freeze_encoder: !ref <freeze_encoder>
+    save_path: whisper_checkpoints
+    encoder_only:  False
 decoder: !new:speechbrain.decoders.seq2seq.S2SWhisperGreedySearch
+    model: !ref <whisper>
+    bos_index: !ref <timestamp_index>
+    eos_index: !ref <eos_index>
+    min_decode_ratio: !ref <min_decode_ratio>
+    max_decode_ratio: !ref <max_decode_ratio>
+# test_beam_searcher: !new:speechbrain.decoders.seq2seq.S2SWhisperBeamSearch
+#     module: [!ref <whisper>]
+#     bos_index: !ref <timestamp_index>
+#     eos_index: !ref <eos_index>
+#     min_decode_ratio: !ref <min_decode_ratio>
+#     max_decode_ratio: !ref <max_decode_ratio>
+#     beam_size: !ref <test_beam_size>
+modules:
     whisper: !ref <whisper>
+    decoder:  !ref <decoder>
+pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
+    loadables:
+        whisper: !ref <whisper>