Training in progress, step 65000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc4b5c38d548341be3fc6afd8378b62fca364b9a262d5e49b6efc3fc65030ea5
 size 402587859

 version https://git-lfs.github.com/spec/v1
+oid sha256:508714af13750110697dcc33ea46fa8c5545e4a94eee6178bdccb17fefcd99b6
 size 402587859

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee27d0a5d8910b44eff2a0ce02526c87e97539b95bf5d100d30d6d417b3f746f
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:110d606f122187e413df09cf2f8a265ed4dfc0d65ceb886e487897d1c6480c2b
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5b9e46153a153464357c8d7cc6f8af8240f1f9bd785168adecd2070b9a4aeb7f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d21af36309ee088c26a278e0de0ae0ae2f4972c410ac6786b526d393ded0505e
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2debf9f408eebd277828e5d3a2c83beeed24c922197846fbb46de266f4c73c50
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:e7ea0fe0b29bea5a2d2fabbca1105b6b1aaa8cbad86b1fc422ee361a528b8ce2
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce0ffd2b212e3bb97c9d1959bc46c09d8be6d1062b4e9a4863f950b2dc626889
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8ddda9abab8cc31fa025268cbb81d6a8c8d8aa990201b862378d198cc478d74
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:10efae63f5e57622a929379da87dd8d685840f8517ee8618d05f88b888c166c2
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d21aba50913ad7356ac8eef62498f347ed0dbc65005eea5be26644550e5a47b
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2c5b2d0eac6380d6179c7b005df331b38821e3646464c4f2ddf0b4dc67ec2f03
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:663047b4a0c5f36263512e8d22703fbf5c49fefd0e151ecb448d12f819828b1d
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4618e81b42373dc5f5648c0a2c9f74dfcdbe40964e20a6736201f60748e5ad2a
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:8d13c4a77964966ff3b3d8b42bdcca922b42a79ca9fbc55e99378b908569c6cd
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.0212765957446808,
-  "global_step": 60000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -726,6 +726,66 @@
       "learning_rate": 0.0001450875916909765,
       "loss": 0.3597,
       "step": 60000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.1063829787234043,
+  "global_step": 65000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.0001450875916909765,
       "loss": 0.3597,
       "step": 60000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 0.00014500650464850112,
+      "loss": 0.3599,
+      "step": 60500
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 0.00014492461416110898,
+      "loss": 0.3597,
+      "step": 61000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 0.00014484208289398622,
+      "loss": 0.3597,
+      "step": 61500
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 0.0001447589116616831,
+      "loss": 0.3595,
+      "step": 62000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 0.00014467510128506612,
+      "loss": 0.3592,
+      "step": 62500
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 0.0001445908221251849,
+      "loss": 0.3592,
+      "step": 63000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 0.0001445057372218952,
+      "loss": 0.3589,
+      "step": 63500
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 0.0001444203598262954,
+      "loss": 0.359,
+      "step": 64000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 0.0001443340050193786,
+      "loss": 0.3585,
+      "step": 64500
+    },
+    {
+      "epoch": 1.11,
+      "learning_rate": 0.000144247015261805,
+      "loss": 0.3586,
+      "step": 65000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee27d0a5d8910b44eff2a0ce02526c87e97539b95bf5d100d30d6d417b3f746f
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:110d606f122187e413df09cf2f8a265ed4dfc0d65ceb886e487897d1c6480c2b
 size 201355195