Training in progress, step 475000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca77a5dbd8026f76af848254207870eb2ccd175c0dee4a8c0fee44891a87588e
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:f630ea11527d197e0051d630a3c7684e04ac097735851914a04564cfa290662a
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d23760072e5a7125a31204d73f6355de96639a56aca3dd44d457dd0c4eb6f41e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:55a346d3f07ebfee804ae0c4f2dae5d72f27c7b679ca8fdd943dd3fd17b9d683
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:21c75708378bb3a4f0d72676110aa9ff474cd2117cc84f11d618f13edbd722d3
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:52127cd3b69efa84d95e8d727cc591494451ce5ed8828e23e997b43eb36eecb2
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aba69dd8ff4d24bad26948637df922ba7515fea7cf8eb37732b35bd310c4bd05
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:dda55b720bc9bae3b0bf6e8c7ffae8f1314b9ba4095ff7cbc54bd1dfc75c8cc7
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:700ce99772259361623e1887fedad42faf671219e9892827c68ca1bdd62d6c20
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:87be04b3b35410443ebe6570babc429a6b6a3f95c5b0f38bfd1c9c5398abfe0a
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:364d3ce7d0b7d1d3913115fb3dbb4222a2d7297db87154518774c80eff073be5
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9f467d9f8afaebc6e44d3fee8e452fbc9bcf86ce65ff48be9ae812a59e27b2c
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0731dd739865cc8a6e81a2a5c07511dd29f52f75cc4568cab5c57bfbd230f902
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:911e6646c31dedcf9cf3679206057244279210182cc9bc754d7e887f4554a86b
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:229f76646f963bb7bb363aeab52140886626dd987202d9c29e3f40f18b9b0846
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:8192356049e5a5cfc33bc765cffbe4a97cbddd7e409ef12d0abda813cadbf6d0
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.999991489434133,
-  "global_step": 470000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5646,6 +5646,66 @@
       "learning_rate": 1.1254771050561826e-05,
       "loss": 0.3186,
       "step": 470000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 8.085105658675245,
+  "global_step": 475000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.1254771050561826e-05,
       "loss": 0.3186,
       "step": 470000
+    },
+    {
+      "epoch": 8.01,
+      "learning_rate": 1.1213740324212508e-05,
+      "loss": 0.3186,
+      "step": 470500
+    },
+    {
+      "epoch": 8.02,
+      "learning_rate": 1.117330558594806e-05,
+      "loss": 0.3189,
+      "step": 471000
+    },
+    {
+      "epoch": 8.03,
+      "learning_rate": 1.1133550139371026e-05,
+      "loss": 0.3185,
+      "step": 471500
+    },
+    {
+      "epoch": 8.03,
+      "learning_rate": 1.1094474376851596e-05,
+      "loss": 0.3187,
+      "step": 472000
+    },
+    {
+      "epoch": 8.04,
+      "learning_rate": 1.1056154796474798e-05,
+      "loss": 0.3186,
+      "step": 472500
+    },
+    {
+      "epoch": 8.05,
+      "learning_rate": 1.1018438191073521e-05,
+      "loss": 0.3187,
+      "step": 473000
+    },
+    {
+      "epoch": 8.06,
+      "learning_rate": 1.0981475797706187e-05,
+      "loss": 0.3186,
+      "step": 473500
+    },
+    {
+      "epoch": 8.07,
+      "learning_rate": 1.0945191867295903e-05,
+      "loss": 0.3186,
+      "step": 474000
+    },
+    {
+      "epoch": 8.08,
+      "learning_rate": 1.0909516085370731e-05,
+      "loss": 0.3186,
+      "step": 474500
+    },
+    {
+      "epoch": 8.09,
+      "learning_rate": 1.0874522198628832e-05,
+      "loss": 0.3185,
+      "step": 475000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d23760072e5a7125a31204d73f6355de96639a56aca3dd44d457dd0c4eb6f41e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:55a346d3f07ebfee804ae0c4f2dae5d72f27c7b679ca8fdd943dd3fd17b9d683
 size 201355195