Training in progress, step 180000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d331c12222b80b51d79250ea6098c76472b90be4bc5c1b95d65991917017c62e
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:e00dfb6570e6058a13ab78da8572c823f929678a4417da77916090ee4d4184d7
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:188a8c5d6cc6a340ca48559f2109ceb5056473930bf637b6adf8f022b805db1b
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:be86d2bff33fa6899dcbcbb8c1514ad5ebc34e19a6d45effffd88614d531f8a2
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5da8050f3fec17f0f993422f7c8b9a867de838f9e7f96dff5dc374b416f9e3d4
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:30f8855e289818b480254745c6cad28b0f999810f519eb5a6ff7a0aea3f235bd
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ffad8df29e4048e4b96e70123f756b3ad525206036229ca856f2bc4d48ba756e
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:62e2e5f68f52a3a8726fcf3e0e6d3f44eb7519f8706c2ed8be8ab76a4686fb8a
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c09d2e030ed75376e9c598986eb072883a0dd110ee2e3eb3f6f27c0576b91e0b
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:93ec12a0879b27c92b709a91bfbb990c2d77c5333a9a37e084db0388a27546be
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2019e6d9402ce5cbaab9baec39e6c5d6ada6535360ac8d7533185c3c59b246f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:573df7989752c7cf0f2122cd80a79b0e2f80ed5dbccbfe72aa70ea81b7853582
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a787ade8dc62bf8a75e9b5431f03a8969a01237878239d8a82a05b8998d77c3b
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b6d639fc9be21ec690ba0f6589e373d572939ddb4c01a4c98a550989e369f97
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ec0bd4652d15557a0929a867fff0e14635cbe144a105685a7b1df5342b007a93
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:9f01adbf075cdc5fa0718f79c0326e3cd028644bccc4e6c2bb8efca7fb627ec8
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.9787150747653213,
-  "global_step": 175000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2106,6 +2106,66 @@
       "learning_rate": 0.00011180676386671593,
       "loss": 0.3389,
       "step": 175000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.063829244006434,
+  "global_step": 180000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00011180676386671593,
       "loss": 0.3389,
       "step": 175000
+    },
+    {
+      "epoch": 2.99,
+      "learning_rate": 0.00011161070859032411,
+      "loss": 0.3387,
+      "step": 175500
+    },
+    {
+      "epoch": 3.0,
+      "learning_rate": 0.00011141434132900025,
+      "loss": 0.3385,
+      "step": 176000
+    },
+    {
+      "epoch": 3.0,
+      "learning_rate": 0.00011121805768356343,
+      "loss": 0.339,
+      "step": 176500
+    },
+    {
+      "epoch": 3.01,
+      "learning_rate": 0.00011102107288390457,
+      "loss": 0.3386,
+      "step": 177000
+    },
+    {
+      "epoch": 3.02,
+      "learning_rate": 0.00011082378191878007,
+      "loss": 0.3383,
+      "step": 177500
+    },
+    {
+      "epoch": 3.03,
+      "learning_rate": 0.000110626582228053,
+      "loss": 0.3385,
+      "step": 178000
+    },
+    {
+      "epoch": 3.04,
+      "learning_rate": 0.00011042908147320174,
+      "loss": 0.3391,
+      "step": 178500
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 0.00011023128159568977,
+      "loss": 0.339,
+      "step": 179000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 0.00011003278725476702,
+      "loss": 0.3386,
+      "step": 179500
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 0.00010983399650235882,
+      "loss": 0.3384,
+      "step": 180000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:188a8c5d6cc6a340ca48559f2109ceb5056473930bf637b6adf8f022b805db1b
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:be86d2bff33fa6899dcbcbb8c1514ad5ebc34e19a6d45effffd88614d531f8a2
 size 201355195