Training in progress, step 210000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af01b5ca42520bcf619e023d4a16b5298aaa21dec9432e39d57a0c72c202ab9a
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:38516ca0517e9c7bd41fc6158ae087a6a134bc2f0dd8c89f13752386bca97a63
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:354a0aed676b29ec3760436e5b6c43c03cc9569f889c0b3b60a7749726eff99e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a63ed5615691b5a4420962dc27128e6f0d4753bfd9410a7b1a6cb622c4acbb5
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7e14ecc5beeebc62d444ee2189eaa9cdcc7f712888371458a0734a769c8606f9
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a7b9ac978a897533a1d78caa11e5297f0a94874bb93aaeed60274a7803c253d
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3da12d484b890ae8d00ec81f880f5fcabe9fab18446a270662286922b1e88c62
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d9cd11c5bacff161047696669bdb8c61b5441b53c0bd485fe06a6c941142e724
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ccafac50eaf81a2756a49700e4d5786269f5269edf292835f3f910779efbc3a3
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:201bf8b89cfe750a906681c70ce5fcc90044ccfff90a7a74d8d20d43f92cd11c
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d5b3f1141ef34f4da98944cd3ac205ef2d95d3e7571bb5e5867c779db9ce0e85
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:927df4b0b2eb7b67c90634dcefcb8439b0df0747bad04d2776fd3935f5b131b8
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5570cbca9105b2caec7d33a540aca9f5afd3920d293c8c6ddfc4a69132c812c3
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7065456e80f792ecf63d108cd10a4439c5d10426363e793cec85f5588f73d66
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:17870ec46d59ea66d97c4e19444a8e5193a2206169a62e6711fb724252fcfe69
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:da455c6df82b96f0b604fd8d8cf8c2607892cf7ef66ee8eb4c9f7c2eee60e455
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.4893575373826606,
-  "global_step": 205000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2466,6 +2466,66 @@
       "learning_rate": 9.956400828538178e-05,
       "loss": 0.3358,
       "step": 205000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.5744631960579056,
+  "global_step": 210000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 9.956400828538178e-05,
       "loss": 0.3358,
       "step": 205000
+    },
+    {
+      "epoch": 3.5,
+      "learning_rate": 9.935318679532955e-05,
+      "loss": 0.3353,
+      "step": 205500
+    },
+    {
+      "epoch": 3.51,
+      "learning_rate": 9.914217506040476e-05,
+      "loss": 0.3356,
+      "step": 206000
+    },
+    {
+      "epoch": 3.51,
+      "learning_rate": 9.893055172104751e-05,
+      "loss": 0.3354,
+      "step": 206500
+    },
+    {
+      "epoch": 3.52,
+      "learning_rate": 9.871874154478737e-05,
+      "loss": 0.3352,
+      "step": 207000
+    },
+    {
+      "epoch": 3.53,
+      "learning_rate": 9.850674662210523e-05,
+      "loss": 0.3349,
+      "step": 207500
+    },
+    {
+      "epoch": 3.54,
+      "learning_rate": 9.829456904530539e-05,
+      "loss": 0.3349,
+      "step": 208000
+    },
+    {
+      "epoch": 3.55,
+      "learning_rate": 9.808263580357464e-05,
+      "loss": 0.3351,
+      "step": 208500
+    },
+    {
+      "epoch": 3.56,
+      "learning_rate": 9.787052480668757e-05,
+      "loss": 0.3352,
+      "step": 209000
+    },
+    {
+      "epoch": 3.57,
+      "learning_rate": 9.76578125405694e-05,
+      "loss": 0.3355,
+      "step": 209500
+    },
+    {
+      "epoch": 3.57,
+      "learning_rate": 9.744535194458411e-05,
+      "loss": 0.3354,
+      "step": 210000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:354a0aed676b29ec3760436e5b6c43c03cc9569f889c0b3b60a7749726eff99e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a63ed5615691b5a4420962dc27128e6f0d4753bfd9410a7b1a6cb622c4acbb5
 size 201355195