Training in progress, step 440000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:615b67beaebd9fc11db06c2376748df967a3e0597412b5fbc3de1df84085bf30
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:fc0113f382a306d0a0270cc8535391c33e1b2af74c51de2e1c6e0d4578e71f9c
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef4ded1c570c6515d92814a413bd59666ae763eb46a809315444972ca8266201
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b3d022a38f882829086501961b7aec842ba9d1cefbd1f74a31fb9e986a1e317
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c23b9ae5a4f78c49e5f3efe50a5ebccd6e5966ba4b0b8d5764d0403ecb74aac4
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed98cd2de93fa24e1ee3c183460e1effd6d0ba45b92a42bfec1f09fdd419d79d
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dbaa614a2f99741bfcaecef4c4718ba56e8945228cbbf85c2b8009964d63bd85
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:363e1050ee631150a25cc4a6efefa58b6bb8d8306f6480ffc47a3c0e8283d574
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a37573b1c526ec4918e05947745d8dab3ff6f75434a218b31f02401e2c40760f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:70b712440aa43dfef04d3a47555cf899fa15b72d21aa9040c97153ccae5f1d3d
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e554c436f1253409d772e9d5282829d58b498573460fd583fd0185782170b927
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:e73f119d26c8a8d8cbe371942faaf6d5f3c3d949f47febc7dbbe088658221663
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4d4cd1ca0fe0185565e4959b8efebca361d6e5c0d3a4ff3c3b51faf577175581
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4e57b8b8ebc2b0b446feb6aa39819ad3fe38c47f0f6f4374fa7a07e55d973d2
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:142284cd18825de16ea2c5e9e3b90ce2a14b040ec54c9e7c11ab653d2cc9c8bb
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:eb2e2a4fb149e5bebf2830e61019116dbdc715ae62bbe8b853e44388c27574ef
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.404251878707416,
-  "global_step": 435000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5226,6 +5226,66 @@
       "learning_rate": 1.578655734817838e-05,
       "loss": 0.3192,
       "step": 435000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 7.48935753738266,
+  "global_step": 440000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.578655734817838e-05,
       "loss": 0.3192,
       "step": 435000
+    },
+    {
+      "epoch": 7.41,
+      "learning_rate": 1.5699323997352622e-05,
+      "loss": 0.3192,
+      "step": 435500
+    },
+    {
+      "epoch": 7.42,
+      "learning_rate": 1.5612725268239792e-05,
+      "loss": 0.3193,
+      "step": 436000
+    },
+    {
+      "epoch": 7.43,
+      "learning_rate": 1.5526762015534355e-05,
+      "loss": 0.3192,
+      "step": 436500
+    },
+    {
+      "epoch": 7.44,
+      "learning_rate": 1.5441435087658935e-05,
+      "loss": 0.3192,
+      "step": 437000
+    },
+    {
+      "epoch": 7.45,
+      "learning_rate": 1.53569140698284e-05,
+      "loss": 0.3193,
+      "step": 437500
+    },
+    {
+      "epoch": 7.46,
+      "learning_rate": 1.5273028503707987e-05,
+      "loss": 0.3191,
+      "step": 438000
+    },
+    {
+      "epoch": 7.46,
+      "learning_rate": 1.518961302104034e-05,
+      "loss": 0.3191,
+      "step": 438500
+    },
+    {
+      "epoch": 7.47,
+      "learning_rate": 1.5106837190727158e-05,
+      "loss": 0.3192,
+      "step": 439000
+    },
+    {
+      "epoch": 7.48,
+      "learning_rate": 1.5024701829732482e-05,
+      "loss": 0.3196,
+      "step": 439500
+    },
+    {
+      "epoch": 7.49,
+      "learning_rate": 1.4943207748699148e-05,
+      "loss": 0.3192,
+      "step": 440000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef4ded1c570c6515d92814a413bd59666ae763eb46a809315444972ca8266201
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b3d022a38f882829086501961b7aec842ba9d1cefbd1f74a31fb9e986a1e317
 size 201355195