Training in progress, step 150000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:27aa7f64a5668997df91945c7aa7132d08b2680aaa25cff1f1eb6757be6962d1
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:340c057c14851ae833de3cc710450e92f28b73faba3e6e2b797775c590c9112f
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e29202b72e61f42c98bc25f38f94ee98f77b85c4c4bbb0df8266a8f3f8636208
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed3477a9cbd8106a26fce5dc6885670b82a628ff97f5f44a25b28c6803baa0b7
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bebfad7a42fafd0d6329fb78b3b96185038870b68e01ba3866bf4bcbf7fadf51
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:78bfcdc5f8d31603c243202ea2e17ab1950c927dc5c5016fae62b983ebe9e1e1
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d162d01ddde70767c9bd5e336a2499ccf3d2396e7d0b7bd1aba9c1d926c83412
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:ddbbbcc0085c3c3412d4ad08f1489a0e2b5ac8e2c094ba1211fb11dee05d5e38
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d1534c814ec2aa6d32a209f8a0be527741a8fd36e30d675e3804369bc95727fb
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c129f476dc2862f36a419e15a11aed6247ca6f392bcfb1f0e011d6fd682b02d0
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c493cb7808c8c84c1bd1c4ad27d29f6c3927fd2c0837f8164a91bfa81d20be30
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:eff4296aefa46c24bf3575f40d88d08cfe8b434da2fa9f20d5131da4319a6071
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:075e346807569ede9b90b05bbb65e7966f610fc696d43bda85981de735e64f8e
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:602374283a35c3573b57bcdea4b872e46b2c01ee008a17814427fffa842d87fa
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b40afc71d1da5a92824e2304336140e2b33816aaeeea8304b470df2b5a3f51c5
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e39b8e2ce44c4392d7d60aaf96fb597369284a27e068da332c89dde5d5e7950
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.468081122713849,
-  "global_step": 145000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1746,6 +1746,66 @@
       "learning_rate": 0.00012292364754923295,
       "loss": 0.3444,
       "step": 145000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.5531867813890945,
+  "global_step": 150000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00012292364754923295,
       "loss": 0.3444,
       "step": 145000
+    },
+    {
+      "epoch": 2.48,
+      "learning_rate": 0.0001227497209833376,
+      "loss": 0.3441,
+      "step": 145500
+    },
+    {
+      "epoch": 2.49,
+      "learning_rate": 0.00012257572161186733,
+      "loss": 0.3439,
+      "step": 146000
+    },
+    {
+      "epoch": 2.49,
+      "learning_rate": 0.00012240095376042992,
+      "loss": 0.3436,
+      "step": 146500
+    },
+    {
+      "epoch": 2.5,
+      "learning_rate": 0.00012222576742869685,
+      "loss": 0.3434,
+      "step": 147000
+    },
+    {
+      "epoch": 2.51,
+      "learning_rate": 0.00012205016434568649,
+      "loss": 0.3434,
+      "step": 147500
+    },
+    {
+      "epoch": 2.52,
+      "learning_rate": 0.00012187414624453037,
+      "loss": 0.3433,
+      "step": 148000
+    },
+    {
+      "epoch": 2.53,
+      "learning_rate": 0.00012169771486245609,
+      "loss": 0.3429,
+      "step": 148500
+    },
+    {
+      "epoch": 2.54,
+      "learning_rate": 0.00012152087194077019,
+      "loss": 0.3429,
+      "step": 149000
+    },
+    {
+      "epoch": 2.54,
+      "learning_rate": 0.00012134361922484087,
+      "loss": 0.3435,
+      "step": 149500
+    },
+    {
+      "epoch": 2.55,
+      "learning_rate": 0.0001211659584640809,
+      "loss": 0.3427,
+      "step": 150000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e29202b72e61f42c98bc25f38f94ee98f77b85c4c4bbb0df8266a8f3f8636208
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed3477a9cbd8106a26fce5dc6885670b82a628ff97f5f44a25b28c6803baa0b7
 size 201355195