Training in progress, step 3000

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +84 -3
pytorch_model.bin +1 -1
runs/Apr12_05-50-01_129-159-47-80/events.out.tfevents.1681278622.129-159-47-80.68729.10 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:588d10af448e2bc968a47db13cf54f392be06f9cd285212df059eff45cf2fa0d
 size 302223127

 version https://git-lfs.github.com/spec/v1
+oid sha256:32cef5ab050e632515a0a2aaf3445b5327ddb40735bec95e5a98a5c88722de3e
 size 302223127

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bb3c2e5fe2e33248d91ddc549145efbe72f18da134c43f3a130bc12fc2791b7
 size 151097331

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7e8cac498b492ce5e234a66e906c5bb4a45ff41a3563056385f45009b84142e
 size 151097331

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d6b3a7b0d7250afb6790645a395c91193529b5bce0f81403756e2fcd59e249d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:dfc172c91a14f3a61f00ce1202c6ffe9f6f9e454d5d0e8b9b96f1057561102fb
 size 14503

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:060481cf2a2651fa80909e9664860c4e95fbd3721e7009ca268a507e0a3e6fb6
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5a79439619f4b20ecf7c8d20593147464500cb27c3d447ec4f9e2d9cb88ff40
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": 42.17917675544795,
   "best_model_checkpoint": "whisper-tiny-v2-ta_tf32_adamBetas_2/checkpoint-2100",
-  "epoch": 0.9475346552026671,
-  "global_step": 2700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -735,11 +735,92 @@
       "eval_steps_per_second": 0.835,
       "eval_wer": 43.389830508474574,
       "step": 2700
     }
   ],
   "max_steps": 4000,
   "num_train_epochs": 2,
-  "total_flos": 2.127071674368e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": 42.17917675544795,
   "best_model_checkpoint": "whisper-tiny-v2-ta_tf32_adamBetas_2/checkpoint-2100",
+  "epoch": 1.052816283558519,
+  "global_step": 3000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.835,
       "eval_wer": 43.389830508474574,
       "step": 2700
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 5.464285714285714e-06,
+      "loss": 0.2813,
+      "step": 2725
+    },
+    {
+      "epoch": 0.97,
+      "learning_rate": 5.357142857142857e-06,
+      "loss": 0.2723,
+      "step": 2750
+    },
+    {
+      "epoch": 0.97,
+      "learning_rate": 5.25e-06,
+      "loss": 0.3075,
+      "step": 2775
+    },
+    {
+      "epoch": 0.98,
+      "learning_rate": 5.142857142857143e-06,
+      "loss": 0.29,
+      "step": 2800
+    },
+    {
+      "epoch": 0.99,
+      "learning_rate": 5.035714285714285e-06,
+      "loss": 0.2939,
+      "step": 2825
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 4.9285714285714286e-06,
+      "loss": 0.2718,
+      "step": 2850
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 4.821428571428572e-06,
+      "loss": 0.2876,
+      "step": 2875
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 4.714285714285714e-06,
+      "loss": 0.2661,
+      "step": 2900
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 4.6071428571428574e-06,
+      "loss": 0.2742,
+      "step": 2925
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 4.5e-06,
+      "loss": 0.2796,
+      "step": 2950
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 4.392857142857143e-06,
+      "loss": 0.2745,
+      "step": 2975
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 4.2857142857142855e-06,
+      "loss": 0.2717,
+      "step": 3000
+    },
+    {
+      "epoch": 1.05,
+      "eval_loss": 0.3490868806838989,
+      "eval_runtime": 15.5303,
+      "eval_samples_per_second": 6.439,
+      "eval_steps_per_second": 0.837,
+      "eval_wer": 43.14769975786925,
+      "step": 3000
     }
   ],
   "max_steps": 4000,
   "num_train_epochs": 2,
+  "total_flos": 2.36333911486464e+18,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bb3c2e5fe2e33248d91ddc549145efbe72f18da134c43f3a130bc12fc2791b7
 size 151097331

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7e8cac498b492ce5e234a66e906c5bb4a45ff41a3563056385f45009b84142e
 size 151097331

runs/Apr12_05-50-01_129-159-47-80/events.out.tfevents.1681278622.129-159-47-80.68729.10 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96344533184767076db486faeb3306156a3c105f3e24ffd49f2374633a4e8a51
-size 24613

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c393ea2a6dc948c7db1f9b9365c73d8079e84ebe79bb9986dbc909620cf258e
+size 26815