Training in progress, step 300000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3750ebe1ae2da9f01607daef1cb133b33e971a37e9ce8e1d24eb674160fe4ca0
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:8e0fdaa95ab3769d07df2ec51220f48b4f0841e4213a25b8b108ae9d6226afa4
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ac4829037cd81943e3821ef74a6801cc24dc1fa1d45cc60ec3587e504efaac1
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:443e5aa7e996d90b484593947423fcad9e8622bdc24cf5219c910bf081fc9e4d
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3100e1f748b9c8003b83deeae985130a3ecb14b2cdba4bc463eb75df5150d5f3
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:00949b307e65df8e70eaa37baf0faf7e700ae38e102f65265d748363d1e1e7c4
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f63bff5bb77e4674cbdfea1305ba8b8680e73189bd93865f89ea62c792263704
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9d6ac70ad3c1fe3d8c8884698b46b9244004811940695c46fa1538a5a5b31d7
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b7134061263ea454a3d6008a2221f1728c1d3633dff4b7eeed6b2beff5d4c9f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:8a5e462f009c7a4ee06c1f9147b1621f035a4b94b586dd31adf28879a9b99385
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8ed60e7003523f0c6427f971a8de5ddba4b001d4fd30e1ced45db1a7d82e7e5
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:458d1568c66c2b6e998ac534b4eaa23acfd7b3a602f1f5dabbd94a34b322a8fb
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:13e1aa031e346cfe6be393d14a7fbbf53792c8beb4d208dd0478a21af9fb3ce4
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:36dbb5a5f2343166fdcd4b09f2c157c64ef7e0b97c386ee5912cc0d77f2607ba
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:13084d5229415d51bec58a80f9ece1ab058e32847d6e3120c6b36d493ed74470
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:671bcba81e7f4b7ad88fc97a70ccffd73844d7a00c4684cf55f5df6cd399eaa3
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.021276414668812,
-  "global_step": 295000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3546,6 +3546,66 @@
       "learning_rate": 6.052004387885136e-05,
       "loss": 0.3258,
       "step": 295000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.106382073344057,
+  "global_step": 300000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.052004387885136e-05,
       "loss": 0.3258,
       "step": 295000
+    },
+    {
+      "epoch": 5.03,
+      "learning_rate": 6.030891569899353e-05,
+      "loss": 0.3259,
+      "step": 295500
+    },
+    {
+      "epoch": 5.04,
+      "learning_rate": 6.009798186218815e-05,
+      "loss": 0.3256,
+      "step": 296000
+    },
+    {
+      "epoch": 5.05,
+      "learning_rate": 5.988724445026701e-05,
+      "loss": 0.3255,
+      "step": 296500
+    },
+    {
+      "epoch": 5.06,
+      "learning_rate": 5.96767055431233e-05,
+      "loss": 0.3255,
+      "step": 297000
+    },
+    {
+      "epoch": 5.06,
+      "learning_rate": 5.946636721869104e-05,
+      "loss": 0.3255,
+      "step": 297500
+    },
+    {
+      "epoch": 5.07,
+      "learning_rate": 5.925665162062394e-05,
+      "loss": 0.3254,
+      "step": 298000
+    },
+    {
+      "epoch": 5.08,
+      "learning_rate": 5.904672027594373e-05,
+      "loss": 0.3254,
+      "step": 298500
+    },
+    {
+      "epoch": 5.09,
+      "learning_rate": 5.8836995731675224e-05,
+      "loss": 0.3254,
+      "step": 299000
+    },
+    {
+      "epoch": 5.1,
+      "learning_rate": 5.862748005771498e-05,
+      "loss": 0.3254,
+      "step": 299500
+    },
+    {
+      "epoch": 5.11,
+      "learning_rate": 5.841817532189814e-05,
+      "loss": 0.3252,
+      "step": 300000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ac4829037cd81943e3821ef74a6801cc24dc1fa1d45cc60ec3587e504efaac1
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:443e5aa7e996d90b484593947423fcad9e8622bdc24cf5219c910bf081fc9e4d
 size 201355195