Training in progress, step 38700

Files changed (7) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b90011d2030747356ab243f668e84a5dd813f204960fa97a1bf935274f11a803
 size 168299

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab7425f6f20a7e700795a502bde029c251a95fca2aea4432b7393baa13c654e9
 size 168299

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f86f9ac23d2308cf509eb5e521769eabdf0d8a4b824ea80b156041004f368967
 size 377643361

 version https://git-lfs.github.com/spec/v1
+oid sha256:5f4965a601e3ab51ee0d7f8e7247b30f9ce7dc0c1c09760f0388e9a221dd04cf
 size 377643361

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:feef15ec4ce515fcbab946bd8037cd0308c05666800d5c00311d1e4fdac51f3a
 size 14639

 version https://git-lfs.github.com/spec/v1
+oid sha256:177e387800ca8cd2666fa4801257038fdf7622da72486457a4106aa98f35648d
 size 14639

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f39930d350656455f8be027250b427223ffb576afc64ab4dcc543263c6d75623
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:772e1c2f94d336bf774f1e725393354a53abaa80b5474cd301f1e914f8300325
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dbda78ab6d8ba86f177ee5af752aca87f153835542a0e61265450aeb804bc33e
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:b570477637a779a81744c28011e555936fb69b232ffad60a4d749f8dae2e00c3
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 125.0,
-  "global_step": 32250,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -86,11 +86,27 @@
       "eval_steps_per_second": 3.359,
       "eval_wer": 0.9952380952380953,
       "step": 32250
     }
   ],
   "max_steps": 64500,
   "num_train_epochs": 250,
-  "total_flos": 3.1000734447391457e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 150.0,
+  "global_step": 38700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 3.359,
       "eval_wer": 0.9952380952380953,
       "step": 32250
+    },
+    {
+      "epoch": 150.0,
+      "learning_rate": 4.213463892288862e-05,
+      "loss": 2.3529,
+      "step": 38700
+    },
+    {
+      "epoch": 150.0,
+      "eval_cer": 0.8545454545454545,
+      "eval_loss": 2.290559768676758,
+      "eval_runtime": 8.0265,
+      "eval_samples_per_second": 26.163,
+      "eval_steps_per_second": 3.364,
+      "eval_wer": 0.9952380952380953,
+      "step": 38700
     }
   ],
   "max_steps": 64500,
   "num_train_epochs": 250,
+  "total_flos": 3.720106427628256e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f86f9ac23d2308cf509eb5e521769eabdf0d8a4b824ea80b156041004f368967
 size 377643361

 version https://git-lfs.github.com/spec/v1
+oid sha256:5f4965a601e3ab51ee0d7f8e7247b30f9ce7dc0c1c09760f0388e9a221dd04cf
 size 377643361