Training in progress, step 175000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:602836472b5e2c722465609242f7a47d056ce7ba46e7a86301fef60ff775ce83
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:d331c12222b80b51d79250ea6098c76472b90be4bc5c1b95d65991917017c62e
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c26aab368e09302dcf13e7d296cef18de072ca0cd67c5e930b7cbc403c13a86d
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:188a8c5d6cc6a340ca48559f2109ceb5056473930bf637b6adf8f022b805db1b
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c05bfeb5e98bce683190574682f813e2a522697190e69ee10bf7a068f93b6976
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:5da8050f3fec17f0f993422f7c8b9a867de838f9e7f96dff5dc374b416f9e3d4
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f01f5f84e3a31f42df04145fae58f6f7b1f4506d8b1fe2fb28025394ec8cb07e
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:ffad8df29e4048e4b96e70123f756b3ad525206036229ca856f2bc4d48ba756e
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:10e21d463f6e7cd0c9117ab55e1ffd1516f0bf98cf844492234460cda5925bd4
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c09d2e030ed75376e9c598986eb072883a0dd110ee2e3eb3f6f27c0576b91e0b
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a2d31392d162b7d4d2268dd187329a9f9784b8b62661a5b232ff40ede5f5e92
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:b2019e6d9402ce5cbaab9baec39e6c5d6ada6535360ac8d7533185c3c59b246f
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:92e5f3bbd27916276b7daba9adf7aec1e0ea749af3982c865282b426347aa9a4
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:a787ade8dc62bf8a75e9b5431f03a8969a01237878239d8a82a05b8998d77c3b
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edb9d0fd6374cceb9b089b55b43f947afaefabbdd3f8ebab7e2dcb2476738627
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:ec0bd4652d15557a0929a867fff0e14635cbe144a105685a7b1df5342b007a93
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.893609416090076,
-  "global_step": 170000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2046,6 +2046,66 @@
       "learning_rate": 0.00011374934798382673,
       "loss": 0.3396,
       "step": 170000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.9787150747653213,
+  "global_step": 175000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00011374934798382673,
       "loss": 0.3396,
       "step": 170000
+    },
+    {
+      "epoch": 2.9,
+      "learning_rate": 0.00011355651779923088,
+      "loss": 0.3393,
+      "step": 170500
+    },
+    {
+      "epoch": 2.91,
+      "learning_rate": 0.00011336335642535168,
+      "loss": 0.3391,
+      "step": 171000
+    },
+    {
+      "epoch": 2.92,
+      "learning_rate": 0.00011316986576861393,
+      "loss": 0.3394,
+      "step": 171500
+    },
+    {
+      "epoch": 2.93,
+      "learning_rate": 0.00011297604773869221,
+      "loss": 0.3395,
+      "step": 172000
+    },
+    {
+      "epoch": 2.94,
+      "learning_rate": 0.00011278229285900902,
+      "loss": 0.3397,
+      "step": 172500
+    },
+    {
+      "epoch": 2.94,
+      "learning_rate": 0.00011258782646982266,
+      "loss": 0.3396,
+      "step": 173000
+    },
+    {
+      "epoch": 2.95,
+      "learning_rate": 0.0001123930384519453,
+      "loss": 0.3392,
+      "step": 173500
+    },
+    {
+      "epoch": 2.96,
+      "learning_rate": 0.00011219793072785603,
+      "loss": 0.3394,
+      "step": 174000
+    },
+    {
+      "epoch": 2.97,
+      "learning_rate": 0.00011200250522318928,
+      "loss": 0.3391,
+      "step": 174500
+    },
+    {
+      "epoch": 2.98,
+      "learning_rate": 0.00011180676386671593,
+      "loss": 0.3389,
+      "step": 175000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c26aab368e09302dcf13e7d296cef18de072ca0cd67c5e930b7cbc403c13a86d
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:188a8c5d6cc6a340ca48559f2109ceb5056473930bf637b6adf8f022b805db1b
 size 201355195