Training in progress, step 205000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db0082585963d0779a3f6f845b8a80f0898e8eedf6b822ae1abfa3c565e33123
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:af01b5ca42520bcf619e023d4a16b5298aaa21dec9432e39d57a0c72c202ab9a
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54fb806d94f7814d043292764ccbf83208093216238755776971fd13549a8417
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:354a0aed676b29ec3760436e5b6c43c03cc9569f889c0b3b60a7749726eff99e
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02ff42f6c9444191a36be04b13f7af185230adc9bf275d0694e2347ba302132d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e14ecc5beeebc62d444ee2189eaa9cdcc7f712888371458a0734a769c8606f9
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:effaa00a349e084c8da5b94ad9b11caf6487ba546f1186937a88a0177e674c2a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:3da12d484b890ae8d00ec81f880f5fcabe9fab18446a270662286922b1e88c62
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8cbaa6dd387c55ef769edc414fe52b33f735df38dad67cd88e3197b2fccab40
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:ccafac50eaf81a2756a49700e4d5786269f5269edf292835f3f910779efbc3a3
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0660ca2210537ad62887c89aee0a6b18f7d33e103b3c25af90e948e70a018db8
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d5b3f1141ef34f4da98944cd3ac205ef2d95d3e7571bb5e5867c779db9ce0e85
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c04d92b6e9668a995aa67c0fd2cccd57c4af61acd1f14d12f1653f5c4a66c8e5
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:5570cbca9105b2caec7d33a540aca9f5afd3920d293c8c6ddfc4a69132c812c3
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1aa56a28bbfa690d13bc1188d2e157d2070090a00f8611ce9f5fd886a2b26ea
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:17870ec46d59ea66d97c4e19444a8e5193a2206169a62e6711fb724252fcfe69
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.404251878707415,
-  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2406,6 +2406,66 @@
       "learning_rate": 0.00010166506882009926,
       "loss": 0.3356,
       "step": 200000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.4893575373826606,
+  "global_step": 205000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00010166506882009926,
       "loss": 0.3356,
       "step": 200000
+    },
+    {
+      "epoch": 3.41,
+      "learning_rate": 0.00010145626726491797,
+      "loss": 0.3363,
+      "step": 200500
+    },
+    {
+      "epoch": 3.42,
+      "learning_rate": 0.00010124683571819103,
+      "loss": 0.3363,
+      "step": 201000
+    },
+    {
+      "epoch": 3.43,
+      "learning_rate": 0.00010103719447377321,
+      "loss": 0.3363,
+      "step": 201500
+    },
+    {
+      "epoch": 3.44,
+      "learning_rate": 0.00010082734560073903,
+      "loss": 0.3358,
+      "step": 202000
+    },
+    {
+      "epoch": 3.45,
+      "learning_rate": 0.00010061729117021209,
+      "loss": 0.336,
+      "step": 202500
+    },
+    {
+      "epoch": 3.46,
+      "learning_rate": 0.00010040703325534484,
+      "loss": 0.336,
+      "step": 203000
+    },
+    {
+      "epoch": 3.46,
+      "learning_rate": 0.00010019657393129802,
+      "loss": 0.3359,
+      "step": 203500
+    },
+    {
+      "epoch": 3.47,
+      "learning_rate": 9.998591527522016e-05,
+      "loss": 0.3357,
+      "step": 204000
+    },
+    {
+      "epoch": 3.48,
+      "learning_rate": 9.977505936622718e-05,
+      "loss": 0.3356,
+      "step": 204500
+    },
+    {
+      "epoch": 3.49,
+      "learning_rate": 9.956400828538178e-05,
+      "loss": 0.3358,
+      "step": 205000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54fb806d94f7814d043292764ccbf83208093216238755776971fd13549a8417
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:354a0aed676b29ec3760436e5b6c43c03cc9569f889c0b3b60a7749726eff99e
 size 201355195