pere committed
Commit ab6e372
1 Parent(s): 1fb701e
.gitignore ADDED
@@ -0,0 +1 @@
+ checkpoint-*/
config.json CHANGED
@@ -1,5 +1,5 @@
  {
- "_name_or_path": "openai/whisper-base",
+ "_name_or_path": "openai/whisper-small",
  "activation_dropout": 0.0,
  "activation_function": "gelu",
  "architectures": [
@@ -11,17 +11,17 @@
  50257
  ],
  "bos_token_id": 50257,
- "d_model": 512,
- "decoder_attention_heads": 8,
- "decoder_ffn_dim": 2048,
+ "d_model": 768,
+ "decoder_attention_heads": 12,
+ "decoder_ffn_dim": 3072,
  "decoder_layerdrop": 0.0,
- "decoder_layers": 6,
+ "decoder_layers": 12,
  "decoder_start_token_id": 50258,
  "dropout": 0.0,
- "encoder_attention_heads": 8,
- "encoder_ffn_dim": 2048,
+ "encoder_attention_heads": 12,
+ "encoder_ffn_dim": 3072,
  "encoder_layerdrop": 0.0,
- "encoder_layers": 6,
+ "encoder_layers": 12,
  "eos_token_id": 50257,
  "forced_decoder_ids": null,
  "init_std": 0.02,
@@ -30,7 +30,7 @@
  "max_source_positions": 1500,
  "max_target_positions": 448,
  "model_type": "whisper",
- "num_hidden_layers": 6,
+ "num_hidden_layers": 12,
  "num_mel_bins": 80,
  "pad_token_id": 50257,
  "scale_embedding": false,
run.sh CHANGED
@@ -7,8 +7,9 @@ python run_speech_recognition_seq2seq_streaming.py \
  --model_index_name="Whisper Base Norwegian" \
  --max_steps="5000" \
  --output_dir="./" \
- --per_device_train_batch_size="32" \
+ --per_device_train_batch_size="128" \
  --per_device_eval_batch_size="32" \
+ --lr_scheduler_type="constant_with_warmup" \
  --logging_steps="50" \
  --learning_rate="1e-5" \
  --warmup_steps="500" \
runs/Dec12_08-40-23_dante/1670830840.7423093/events.out.tfevents.1670830840.dante.3225009.1 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:12be5a23fd4a55847c306828d1be0539264b86d9f4593d61be6d348257d9d750
+ size 5696
runs/Dec12_08-40-23_dante/events.out.tfevents.1670830840.dante.3225009.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:a6a07b5fec751b76dd400ecbc88406ceb42568f47d56ca489f8782f18124ac1a
+ size 4165
runs/Dec12_08-47-16_dante/1670831255.707328/events.out.tfevents.1670831255.dante.3230904.1 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ef5197970336869de45d32e740b8c808fd4cfdd5b56c520df13d54ebb0906c0e
+ size 5857
runs/Dec12_08-47-16_dante/events.out.tfevents.1670831255.dante.3230904.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:839afafd6ddf575063388fad3b55544ae380474f898dfcafcfd8a7814fd559c4
+ size 4254
tokenizer_config.json CHANGED
@@ -18,8 +18,8 @@
  "single_word": false
  },
  "errors": "replace",
- "model_max_length": 448,
- "name_or_path": "openai/whisper-base",
+ "model_max_length": 1024,
+ "name_or_path": "openai/whisper-small",
  "pad_token": null,
  "processor_class": "WhisperProcessor",
  "return_attention_mask": false,