Training in progress, step 295000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:51b14eff4a4273c6d3b74abfacfc73b884cf9b9b7c89a08f51ead1f04044721d
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:3750ebe1ae2da9f01607daef1cb133b33e971a37e9ce8e1d24eb674160fe4ca0
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0869ad7d95645188dccb3e4d87a800a424ce412e68cf67a7641e510484c467e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ac4829037cd81943e3821ef74a6801cc24dc1fa1d45cc60ec3587e504efaac1
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:12b3f1f4ef7d54ab74f08b6a6f7af18fc022998fa9e7e56e07868a564d491d66
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:3100e1f748b9c8003b83deeae985130a3ecb14b2cdba4bc463eb75df5150d5f3
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9135594bbb586f075b7638cecd4126fb3316150a75a6fdf73a4dbcbfa23edf9f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f63bff5bb77e4674cbdfea1305ba8b8680e73189bd93865f89ea62c792263704
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:36e6eeeb63a7d5efe3d89e51c42e86fbccb201f0a76f81a39558ea2786f8b6a1
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:8b7134061263ea454a3d6008a2221f1728c1d3633dff4b7eeed6b2beff5d4c9f
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43d15bd14eb8428e51e4855f72917c2a4075d4c0c1aa4a9dd827fec888eb9fd9
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8ed60e7003523f0c6427f971a8de5ddba4b001d4fd30e1ced45db1a7d82e7e5
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e94f3f55189c88e8c606f8b356b8d855b941bd1572eb843a4126c797cf5f785
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:13e1aa031e346cfe6be393d14a7fbbf53792c8beb4d208dd0478a21af9fb3ce4
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6efbd14b80e31c442e70702f490a0feb0bba9ae059c89f649541b88541b74c6a
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:13084d5229415d51bec58a80f9ece1ab058e32847d6e3120c6b36d493ed74470
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 4.936162245427698,
-  "global_step": 290000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3486,6 +3486,66 @@
       "learning_rate": 6.264070302791827e-05,
       "loss": 0.3263,
       "step": 290000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.021276414668812,
+  "global_step": 295000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.264070302791827e-05,
       "loss": 0.3263,
       "step": 290000
+    },
+    {
+      "epoch": 4.94,
+      "learning_rate": 6.242774701957516e-05,
+      "loss": 0.3263,
+      "step": 290500
+    },
+    {
+      "epoch": 4.95,
+      "learning_rate": 6.221496444227476e-05,
+      "loss": 0.3261,
+      "step": 291000
+    },
+    {
+      "epoch": 4.96,
+      "learning_rate": 6.200235739609522e-05,
+      "loss": 0.3261,
+      "step": 291500
+    },
+    {
+      "epoch": 4.97,
+      "learning_rate": 6.179035265954763e-05,
+      "loss": 0.326,
+      "step": 292000
+    },
+    {
+      "epoch": 4.98,
+      "learning_rate": 6.157810260735043e-05,
+      "loss": 0.3261,
+      "step": 292500
+    },
+    {
+      "epoch": 4.99,
+      "learning_rate": 6.136603437184328e-05,
+      "loss": 0.3259,
+      "step": 293000
+    },
+    {
+      "epoch": 5.0,
+      "learning_rate": 6.115457362977345e-05,
+      "loss": 0.3258,
+      "step": 293500
+    },
+    {
+      "epoch": 5.0,
+      "learning_rate": 6.0942874930827204e-05,
+      "loss": 0.326,
+      "step": 294000
+    },
+    {
+      "epoch": 5.01,
+      "learning_rate": 6.0731364318011724e-05,
+      "loss": 0.3256,
+      "step": 294500
+    },
+    {
+      "epoch": 5.02,
+      "learning_rate": 6.052004387885136e-05,
+      "loss": 0.3258,
+      "step": 295000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0869ad7d95645188dccb3e4d87a800a424ce412e68cf67a7641e510484c467e
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ac4829037cd81943e3821ef74a6801cc24dc1fa1d45cc60ec3587e504efaac1
 size 201355195