Training in progress, step 1000

Browse files

Files changed (7) hide show

checkpoint-1000/optimizer.pt +1 -1
checkpoint-1000/pytorch_model.bin +1 -1
checkpoint-1000/scaler.pt +1 -1
checkpoint-1000/scheduler.pt +1 -1
checkpoint-1000/trainer_state.json +31 -31
checkpoint-1000/training_args.bin +1 -1
pytorch_model.bin +1 -1

checkpoint-1000/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0d150bb1a47e890e734324095bdcd55d5623b896320a5e9a0459aa856b42b06
 size 2490362385

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8bbfd4ba575f9da0f10fafd071b49cb2a417b069734ec3f8f25e57b1ace80ce
 size 2490362385

checkpoint-1000/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4aca4a6284adca4d75ba2f01b265d187999f0c8e97b09264b7de0ae8d1cf8e73
 size 1262075377

 version https://git-lfs.github.com/spec/v1
+oid sha256:5413d438578028bae2ac5a1c47311442081ff0b4a1db9b89c2080d69df74655b
 size 1262075377

checkpoint-1000/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7bbf6de402af56dc2b2a14f7e42db0ebd96220f08261d4ff0afbff460336edc5
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:512798d6b261c10f4cf46e1adb2e820c4ee1ce81131c16f70b43feb653238645
 size 559

checkpoint-1000/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1857ca7370610b3ead1d5c1c34b6dfa40788a343fde2e87dcf51cf4b056364d1
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:61c6e8fe2cbf564c32ff5b35a892290556b40ae70bfcf843d4a10850b1b863ed
 size 623

checkpoint-1000/trainer_state.json CHANGED Viewed

@@ -9,85 +9,85 @@
   "log_history": [
     {
       "epoch": 0.29,
-      "learning_rate": 7.151470588235293e-05,
-      "loss": 5.1135,
       "step": 100
     },
     {
       "epoch": 0.58,
-      "learning_rate": 6.710294117647058e-05,
-      "loss": 3.0957,
       "step": 200
     },
     {
       "epoch": 0.87,
-      "learning_rate": 6.269117647058824e-05,
-      "loss": 3.0078,
       "step": 300
     },
     {
       "epoch": 1.16,
-      "learning_rate": 5.827941176470588e-05,
-      "loss": 2.9785,
       "step": 400
     },
     {
       "epoch": 1.45,
-      "learning_rate": 5.3867647058823525e-05,
-      "loss": 2.9069,
       "step": 500
     },
     {
       "epoch": 1.45,
-      "eval_loss": 2.9046826362609863,
-      "eval_runtime": 128.7688,
-      "eval_samples_per_second": 35.878,
-      "eval_steps_per_second": 4.489,
       "eval_wer": 1.0,
       "step": 500
     },
     {
       "epoch": 1.74,
-      "learning_rate": 4.945588235294117e-05,
-      "loss": 2.8537,
       "step": 600
     },
     {
       "epoch": 2.03,
-      "learning_rate": 4.504411764705882e-05,
-      "loss": 2.7928,
       "step": 700
     },
     {
       "epoch": 2.32,
-      "learning_rate": 4.063235294117647e-05,
-      "loss": 2.6988,
       "step": 800
     },
     {
       "epoch": 2.61,
-      "learning_rate": 3.6220588235294115e-05,
-      "loss": 2.6342,
       "step": 900
     },
     {
       "epoch": 2.91,
-      "learning_rate": 3.180882352941176e-05,
-      "loss": 2.5875,
       "step": 1000
     },
     {
       "epoch": 2.91,
-      "eval_loss": 2.415876865386963,
-      "eval_runtime": 164.5912,
-      "eval_samples_per_second": 28.07,
-      "eval_steps_per_second": 3.512,
-      "eval_wer": 1.199687939790736,
       "step": 1000
     }
   ],
-  "max_steps": 1720,
-  "num_train_epochs": 5,
   "total_flos": 2.9636799545011507e+18,
   "trial_name": null,
   "trial_params": null

   "log_history": [
     {
       "epoch": 0.29,
+      "learning_rate": 3.7125e-06,
+      "loss": 12.2713,
       "step": 100
     },
     {
       "epoch": 0.58,
+      "learning_rate": 7.4625e-06,
+      "loss": 6.2026,
       "step": 200
     },
     {
       "epoch": 0.87,
+      "learning_rate": 1.1212499999999998e-05,
+      "loss": 4.1374,
       "step": 300
     },
     {
       "epoch": 1.16,
+      "learning_rate": 1.49625e-05,
+      "loss": 3.6755,
       "step": 400
     },
     {
       "epoch": 1.45,
+      "learning_rate": 1.8712499999999997e-05,
+      "loss": 3.3332,
       "step": 500
     },
     {
       "epoch": 1.45,
+      "eval_loss": 3.292029857635498,
+      "eval_runtime": 137.2974,
+      "eval_samples_per_second": 33.65,
+      "eval_steps_per_second": 4.21,
       "eval_wer": 1.0,
       "step": 500
     },
     {
       "epoch": 1.74,
+      "learning_rate": 2.2462499999999997e-05,
+      "loss": 3.1418,
       "step": 600
     },
     {
       "epoch": 2.03,
+      "learning_rate": 2.6212499999999997e-05,
+      "loss": 3.0879,
       "step": 700
     },
     {
       "epoch": 2.32,
+      "learning_rate": 2.99625e-05,
+      "loss": 3.0216,
       "step": 800
     },
     {
       "epoch": 2.61,
+      "learning_rate": 3.37125e-05,
+      "loss": 2.9595,
       "step": 900
     },
     {
       "epoch": 2.91,
+      "learning_rate": 3.7462499999999996e-05,
+      "loss": 2.9269,
       "step": 1000
     },
     {
       "epoch": 2.91,
+      "eval_loss": 2.941540241241455,
+      "eval_runtime": 178.4388,
+      "eval_samples_per_second": 25.891,
+      "eval_steps_per_second": 3.239,
+      "eval_wer": 0.9966346448020559,
       "step": 1000
     }
   ],
+  "max_steps": 17200,
+  "num_train_epochs": 50,
   "total_flos": 2.9636799545011507e+18,
   "trial_name": null,
   "trial_params": null

checkpoint-1000/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1208f22bb7e06e1e9a51692db0520fbddfc3640941d51dfe45ba3188ada2ecbf
 size 2991

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a168f126d02648193e16ba893c3e1ef9f2c2de91803928caf5e25532aff1325
 size 2991

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff113c93cbec054547814830ddbe3b7e8b56d08002f35055cf5facbab2743f16
 size 1262075377

 version https://git-lfs.github.com/spec/v1
+oid sha256:5413d438578028bae2ac5a1c47311442081ff0b4a1db9b89c2080d69df74655b
 size 1262075377