Training in progress, step 445000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc0113f382a306d0a0270cc8535391c33e1b2af74c51de2e1c6e0d4578e71f9c
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ddd3c37bd4200e08826b0a91d5f24c4ff7218397da5c07f384461ccffb9cb9a
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b3d022a38f882829086501961b7aec842ba9d1cefbd1f74a31fb9e986a1e317
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:03b07a4229a48459c79e80fe855bce597db6900e72bddc707e70f6fbfdf9dfe9
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed98cd2de93fa24e1ee3c183460e1effd6d0ba45b92a42bfec1f09fdd419d79d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f36ebe1c0a4a168a3c7f0b3e3add08a4eb2922192e4272ca5261870371aafca2
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:363e1050ee631150a25cc4a6efefa58b6bb8d8306f6480ffc47a3c0e8283d574
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:253da2fe3f872eb2bc3b8f0a902fed4630b5393d1b6eb6c17b44eefb61bc3cd7
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70b712440aa43dfef04d3a47555cf899fa15b72d21aa9040c97153ccae5f1d3d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:8d999a91a6cc7ee3d02856a88c102af0111baa8c1942338c39f2ea2e1a438591
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e73f119d26c8a8d8cbe371942faaf6d5f3c3d949f47febc7dbbe088658221663
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f88aa60029ff1bb0064fa8b9fff446d83665a7596e171fd5c753540b5ef66f9a
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4e57b8b8ebc2b0b446feb6aa39819ad3fe38c47f0f6f4374fa7a07e55d973d2
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:7330c5c7638e093c49e8abfe8223573d14775e88899da3795fd13f4a889cdc79
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb2e2a4fb149e5bebf2830e61019116dbdc715ae62bbe8b853e44388c27574ef
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:32389c0ec049ef4b8ced7f61f25d86b3dbbfb5bec67ce1197c94aeae299a5a2e
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.48935753738266,
-  "global_step": 440000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5286,6 +5286,66 @@
       "learning_rate": 1.4943207748699148e-05,
       "loss": 0.3192,
       "step": 440000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 7.574463196057906,
+  "global_step": 445000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.4943207748699148e-05,
       "loss": 0.3192,
       "step": 440000
+    },
+    {
+      "epoch": 7.5,
+      "learning_rate": 1.4862516814602821e-05,
+      "loss": 0.3191,
+      "step": 440500
+    },
+    {
+      "epoch": 7.51,
+      "learning_rate": 1.478230641353945e-05,
+      "loss": 0.3189,
+      "step": 441000
+    },
+    {
+      "epoch": 7.51,
+      "learning_rate": 1.4702739684782337e-05,
+      "loss": 0.319,
+      "step": 441500
+    },
+    {
+      "epoch": 7.52,
+      "learning_rate": 1.4623817413622956e-05,
+      "loss": 0.319,
+      "step": 442000
+    },
+    {
+      "epoch": 7.53,
+      "learning_rate": 1.4545696288600928e-05,
+      "loss": 0.3193,
+      "step": 442500
+    },
+    {
+      "epoch": 7.54,
+      "learning_rate": 1.4468063970276709e-05,
+      "loss": 0.3191,
+      "step": 443000
+    },
+    {
+      "epoch": 7.55,
+      "learning_rate": 1.4391078425704797e-05,
+      "loss": 0.319,
+      "step": 443500
+    },
+    {
+      "epoch": 7.56,
+      "learning_rate": 1.4314740414701418e-05,
+      "loss": 0.319,
+      "step": 444000
+    },
+    {
+      "epoch": 7.57,
+      "learning_rate": 1.423905069069194e-05,
+      "loss": 0.3191,
+      "step": 444500
+    },
+    {
+      "epoch": 7.57,
+      "learning_rate": 1.4164010000703365e-05,
+      "loss": 0.319,
+      "step": 445000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b3d022a38f882829086501961b7aec842ba9d1cefbd1f74a31fb9e986a1e317
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:03b07a4229a48459c79e80fe855bce597db6900e72bddc707e70f6fbfdf9dfe9
 size 201355195