Training in progress, epoch 3

Files changed (7) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7c9ecfd8cb0e06bed2cac1481c181a5f5806b9fbb515be84dd43196c51028d7
 size 721661957

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6b2aa8d5ecf76432f05f192ff200fb716fa8c78842680632b5770377aeb114a
 size 721661957

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:277228f7704eb9c2030d52a5e32186caa0e78367a08ec5637af6d3bdaf2272a8
 size 377646433

 version https://git-lfs.github.com/spec/v1
+oid sha256:459065713e825f184f3249a51b1cb1fdcf8c4e55d65360afde852d992639e851
 size 377646433

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28ae1a2ba23ced9a3c01553e9871d4c80b2fa566d38f5b037e8bad7cad979aa1
 size 14639

 version https://git-lfs.github.com/spec/v1
+oid sha256:776a1ffc7ef953e1d194b3c21ab858fead4f972f57a0b06bf2e4701dffb4d441
 size 14639

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6aa6b07303f228edfba2736d5f036cc1b3f8047a6cbf3bc89bdceff6f9b1a850
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:cbeff4b41d7db09fb8142adc42392e017e3a3c51c8c7e46d04b5fa617f53bfb3
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:47e741874f800d6c85d0ad4fac0bcbd8bbe385fe10b357506f204fa594702563
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:29a1ea701475afc9177572549048e0d86de191233089e775d17466cee30267ad
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.0,
-  "global_step": 8540,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -40,11 +40,28 @@
       "eval_samples_per_second": 24.979,
       "eval_steps_per_second": 3.212,
       "step": 8540
     }
   ],
   "max_steps": 64050,
   "num_train_epochs": 15,
-  "total_flos": 6.465255166176154e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.0,
+  "global_step": 12810,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 24.979,
       "eval_steps_per_second": 3.212,
       "step": 8540
+    },
+    {
+      "epoch": 3.0,
+      "learning_rate": 8.422626873520904e-05,
+      "loss": 0.6119,
+      "step": 12810
+    },
+    {
+      "epoch": 3.0,
+      "eval_cer": 0.15064935064935064,
+      "eval_loss": 0.8806686997413635,
+      "eval_new_wer": 0.12380952380952381,
+      "eval_old_wer": 0.2904761904761905,
+      "eval_runtime": 8.4758,
+      "eval_samples_per_second": 24.776,
+      "eval_steps_per_second": 3.186,
+      "step": 12810
     }
   ],
   "max_steps": 64050,
   "num_train_epochs": 15,
+  "total_flos": 9.70374678984573e+18,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:277228f7704eb9c2030d52a5e32186caa0e78367a08ec5637af6d3bdaf2272a8
 size 377646433

 version https://git-lfs.github.com/spec/v1
+oid sha256:459065713e825f184f3249a51b1cb1fdcf8c4e55d65360afde852d992639e851
 size 377646433