Training in progress, step 500

Browse files

Files changed (14) hide show

config.json +42 -0
last-checkpoint/config.json +42 -0
last-checkpoint/optimizer.pt +3 -0
last-checkpoint/preprocessor_config.json +0 -0
last-checkpoint/pytorch_model.bin +3 -0
last-checkpoint/rng_state.pth +3 -0
last-checkpoint/scaler.pt +3 -0
last-checkpoint/scheduler.pt +3 -0
last-checkpoint/trainer_state.json +37 -0
last-checkpoint/training_args.bin +3 -0
pytorch_model.bin +3 -0
runs/Dec07_10-13-58_5b012053c450/1670408086.057574/events.out.tfevents.1670408086.5b012053c450.76.1 +0 -0
runs/Dec07_10-13-58_5b012053c450/events.out.tfevents.1670408086.5b012053c450.76.0 +3 -0
training_args.bin +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "_name_or_path": "openai/whisper-small",
+  "activation_dropout": 0.0,
+  "activation_function": "gelu",
+  "architectures": [
+    "WhisperForConditionalGeneration"
+  ],
+  "attention_dropout": 0.0,
+  "begin_suppress_tokens": [
+    220,
+    50257
+  ],
+  "bos_token_id": 50257,
+  "d_model": 768,
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 12,
+  "decoder_start_token_id": 50258,
+  "dropout": 0.0,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 12,
+  "eos_token_id": 50257,
+  "forced_decoder_ids": null,
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "max_length": 448,
+  "max_source_positions": 1500,
+  "max_target_positions": 448,
+  "model_type": "whisper",
+  "num_hidden_layers": 12,
+  "num_mel_bins": 80,
+  "pad_token_id": 50257,
+  "scale_embedding": false,
+  "suppress_tokens": [],
+  "torch_dtype": "float32",
+  "transformers_version": "4.26.0.dev0",
+  "use_cache": true,
+  "vocab_size": 51865
+}

last-checkpoint/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "_name_or_path": "openai/whisper-small",
+  "activation_dropout": 0.0,
+  "activation_function": "gelu",
+  "architectures": [
+    "WhisperForConditionalGeneration"
+  ],
+  "attention_dropout": 0.0,
+  "begin_suppress_tokens": [
+    220,
+    50257
+  ],
+  "bos_token_id": 50257,
+  "d_model": 768,
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 12,
+  "decoder_start_token_id": 50258,
+  "dropout": 0.0,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 12,
+  "eos_token_id": 50257,
+  "forced_decoder_ids": null,
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "max_length": 448,
+  "max_source_positions": 1500,
+  "max_target_positions": 448,
+  "model_type": "whisper",
+  "num_hidden_layers": 12,
+  "num_mel_bins": 80,
+  "pad_token_id": 50257,
+  "scale_embedding": false,
+  "suppress_tokens": [],
+  "torch_dtype": "float32",
+  "transformers_version": "4.26.0.dev0",
+  "use_cache": true,
+  "vocab_size": 51865
+}

last-checkpoint/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3019d592ac2214bc34c970a13e858f6a548e2f3c6a8529ed995697d3017ddf2
+size 1934158597

last-checkpoint/preprocessor_config.json ADDED Viewed

The diff for this file is too large to render. See raw diff

last-checkpoint/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0db5428df45748f5cef71a46ba6d813033461045b670de58e60a0d04c73f3187
+size 967099139

last-checkpoint/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91df483d76db818e32264a4bed794781b8c0596f68ba0c37ccc0e11599204a99
+size 14439

last-checkpoint/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:260a33848ea3e9ae911e570cae9bcabce5ca488fc1c8b3df9ab2ca3c3443394c
+size 559

last-checkpoint/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:016fe8e8a044cb8b996a30294312b233b45f5a8658dbff1e6856e6b8a5f831c6
+size 623

last-checkpoint/trainer_state.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "best_metric": 23.903632599284773,
+  "best_model_checkpoint": "drive/MyDrive/whisper-small-sv/checkpoint-500",
+  "epoch": 0.6468305304010349,
+  "global_step": 500,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.32,
+      "learning_rate": 4.92e-06,
+      "loss": 1.683,
+      "step": 250
+    },
+    {
+      "epoch": 0.65,
+      "learning_rate": 9.920000000000002e-06,
+      "loss": 0.326,
+      "step": 500
+    },
+    {
+      "epoch": 0.65,
+      "eval_loss": 0.32677161693573,
+      "eval_runtime": 2129.4049,
+      "eval_samples_per_second": 2.38,
+      "eval_steps_per_second": 0.298,
+      "eval_wer": 23.903632599284773,
+      "step": 500
+    }
+  ],
+  "max_steps": 4000,
+  "num_train_epochs": 6,
+  "total_flos": 2.30868320256e+18,
+  "trial_name": null,
+  "trial_params": null
+}

last-checkpoint/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94e1db512506afa070e85c2110e25009481ea0e30add79b38ed7e6b55384b1f1
+size 3567

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0db5428df45748f5cef71a46ba6d813033461045b670de58e60a0d04c73f3187
+size 967099139

runs/Dec07_10-13-58_5b012053c450/1670408086.057574/events.out.tfevents.1670408086.5b012053c450.76.1 CHANGED Viewed

Binary files a/runs/Dec07_10-13-58_5b012053c450/1670408086.057574/events.out.tfevents.1670408086.5b012053c450.76.1 and b/runs/Dec07_10-13-58_5b012053c450/1670408086.057574/events.out.tfevents.1670408086.5b012053c450.76.1 differ

runs/Dec07_10-13-58_5b012053c450/events.out.tfevents.1670408086.5b012053c450.76.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f36c0674570e3ff7d5abd65d722c847cc6ea5e9d73730d2064e007f6ba79aa6
+size 4906

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94e1db512506afa070e85c2110e25009481ea0e30add79b38ed7e6b55384b1f1
+size 3567