Training in progress, step 400000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8badaf858040e9a408943a6e9fbd7b673381f667c74f44da38b93b7faa806cd6
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:935482101098fd1bcdba8ff4db7e80c3829f3028494140828e0a94cd2691c2d8
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7e0679255ea6b36201b0d808a362cef9e0cc4250bf2a27a7d227fb77c38b5a3
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bf63b57e9c92ad51945b78dcd295810ddc94ae491f8c80e57b169bae7716317
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:321f848c05abd7bede59850502e9582f8a2efa51300e70f7c4e42416383b1f9d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:325753cffb70e35308b5d9f5fd9d5f81e4abc5575cc397e717b388a32e603120
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7173cab8fec53de370fc776b8ec60abd28823c70815e5aae8f471b1d4cd8593a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0a5f6b1461ae68dec64360dd3e057905146ceae77ab814e4a2b5b43cca29a7d
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9bbf3b61889bf57772bca69e3fa2b3a58e51beabaa460befd9b8ff1bc01f45da
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:5791c011f9c77cc08334bc5642cc18df6e799e70037d743754cc941773ed51bd
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:053726ed745fa923b4c9b6b87c5501b19122cc00993e8b017178f10a7f218f5b
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:33d463e038379047a89525a90e8d432deeb676fbca369621cedef5ebd2be17cc
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:062ee8ab98f80273aee87dab235a0bc7258dc420c22cabc1af7c5b580c42129d
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e8834f32b5068af02b0ae35e7bc2e78bf21aef2c72704751d0c45945323a934
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09de475ccd38f92b9bb28c41a7de8a4a2d4763ec7818473a0c7e4d4586d6efeb
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:c579cbfbdb05c1d3520e249d34e85627c452e7287efcbb543d8b7d39834bb0fc
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.723398098739585,
-  "global_step": 395000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4746,6 +4746,66 @@
       "learning_rate": 2.473041898715981e-05,
       "loss": 0.3201,
       "step": 395000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.80850375741483,
+  "global_step": 400000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.473041898715981e-05,
       "loss": 0.3201,
       "step": 395000
+    },
+    {
+      "epoch": 6.73,
+      "learning_rate": 2.459600848399211e-05,
+      "loss": 0.3203,
+      "step": 395500
+    },
+    {
+      "epoch": 6.74,
+      "learning_rate": 2.4462142610782094e-05,
+      "loss": 0.3203,
+      "step": 396000
+    },
+    {
+      "epoch": 6.75,
+      "learning_rate": 2.4328556058264563e-05,
+      "loss": 0.3203,
+      "step": 396500
+    },
+    {
+      "epoch": 6.76,
+      "learning_rate": 2.419551896042324e-05,
+      "loss": 0.3201,
+      "step": 397000
+    },
+    {
+      "epoch": 6.77,
+      "learning_rate": 2.4063032630280625e-05,
+      "loss": 0.3201,
+      "step": 397500
+    },
+    {
+      "epoch": 6.77,
+      "learning_rate": 2.3931098375423278e-05,
+      "loss": 0.3203,
+      "step": 398000
+    },
+    {
+      "epoch": 6.78,
+      "learning_rate": 2.3799717497989015e-05,
+      "loss": 0.3202,
+      "step": 398500
+    },
+    {
+      "epoch": 6.79,
+      "learning_rate": 2.3668891294654094e-05,
+      "loss": 0.3199,
+      "step": 399000
+    },
+    {
+      "epoch": 6.8,
+      "learning_rate": 2.3538621056620283e-05,
+      "loss": 0.3202,
+      "step": 399500
+    },
+    {
+      "epoch": 6.81,
+      "learning_rate": 2.340890806960229e-05,
+      "loss": 0.3201,
+      "step": 400000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7e0679255ea6b36201b0d808a362cef9e0cc4250bf2a27a7d227fb77c38b5a3
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bf63b57e9c92ad51945b78dcd295810ddc94ae491f8c80e57b169bae7716317
 size 201355195