Training in progress, step 253000

Files changed (7) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d90b5ebf06155c70e5daaed08d4546a39daa7266301f513e66d0f15d5d9c2419
 size 174303

 version https://git-lfs.github.com/spec/v1
+oid sha256:388bd495779c635d92b8b205e680b77c3f1bfab35ea510932d89ca31c5ddc44e
 size 174303

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:006603074de6c85bed0b63caa3b4683fd8c57fcc139a2078427be4973258a0ca
 size 377644503

 version https://git-lfs.github.com/spec/v1
+oid sha256:804f5bf7419f8a372aa88b22397e3d90f6fabffb7c4cfdf6488d88770701396b
 size 377644503

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b8ed9eaeb1d9ab140f4512af9b406c20f1538f4b8c592f9db794da85ff0be0c
-size 14631

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ea70ed9280c12cd12fbcab48baf0f73b6b95b5c739aae22db8aee504cb07a30
+size 14567

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3904f4b3e0aa9dbb4cdd97547b68b0456e4a8a564d2f4160ea6926a391a9084b
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:b4e7fc9cbae8d2a52769f62d26282c6279fa2b6f27e451041ffe84c4854b2d2d
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e219c08226b8a6731a1a132fa7e719ca671984e8d0bd51af0489dd0ee562b55
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2ebe698f52b0c8b82a4138a896e5905ffe8f78bfa76ddbb42f4e9d92fc35fc2
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 900.0,
-  "global_step": 227700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -150,11 +150,27 @@
       "eval_steps_per_second": 26.884,
       "eval_wer": 1.0,
       "step": 227700
     }
   ],
   "max_steps": 253000,
   "num_train_epochs": 1000,
-  "total_flos": 2.104540714316478e+20,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1000.0,
+  "global_step": 253000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 26.884,
       "eval_wer": 1.0,
       "step": 227700
+    },
+    {
+      "epoch": 1000.0,
+      "learning_rate": 4.951112960266278e-08,
+      "loss": 2.3067,
+      "step": 253000
+    },
+    {
+      "epoch": 1000.0,
+      "eval_cer": 0.8883116883116883,
+      "eval_loss": 2.9747302532196045,
+      "eval_runtime": 0.6721,
+      "eval_samples_per_second": 208.293,
+      "eval_steps_per_second": 26.781,
+      "eval_wer": 1.0,
+      "step": 253000
     }
   ],
   "max_steps": 253000,
   "num_train_epochs": 1000,
+  "total_flos": 2.3383716160651048e+20,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:006603074de6c85bed0b63caa3b4683fd8c57fcc139a2078427be4973258a0ca
 size 377644503

 version https://git-lfs.github.com/spec/v1
+oid sha256:804f5bf7419f8a372aa88b22397e3d90f6fabffb7c4cfdf6488d88770701396b
 size 377644503