Training in progress, step 365000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f9bb647830011f1f0c4939bdfd58513ca8d1b6b369f0f905ba5d1b59dff0d694
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f7dc68662c82c6ffbedd49f2076ab28a2c01e48540614ce2f174a82223716ed
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7697a15ef9673439312fb036c35de00fc97c3f08924c4d9a382535bc3e9dd969
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:0696c7f5ae19cb889783a904f338158b48f61bac33c2488b7805a376c9387ff9
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aac6ab5786efe14d88a6dfd5c47656ff2718062b841d7abdc16c78094b2cc8d5
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9814acc3b57dc08524e0312f095af7ed7dfbb32d1dc12c13c3e82715351d160
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5c94c7c084b365de19772f29fe1d2ffdd18e2bd3f744bc288dfa9981c05f383e
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb6d0a859d60adef9c8fe8ecfc6811c66d512f2c7bc8e8e2bc033710665ec541
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:867e91d51677fc0001645b808eefef44c8c1a86f4c9210d1d3576b946cebac35
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:889772b5bbee7f72c148bc34b08a45896a822f63a7afe8ab5db2d7f65588263c
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:434def7e802ff1b8a0587a049f8cb9ff64f00a3dc17caa9f58fe716c7c9ce5bd
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:da9aedaff3157e59f253dc3a5b6a6100df76d1279d035f184adbb4b5eb1551ed
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e1e4bec7cc11f69c6b820a428063a4e9aab696285a5c1947c10e8d9e21010fca
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8fb9b18d70589928b384e18f28370eb0d78024bdf16f6b9c2c6b57b8dcc9be8
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:74433998881e570fe5797566e28e4a779b8ade1b81209fbf1fa056d46d071355
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:910ecb4645c6ef73635557af0ae3d409a37a838e704079ef7d2edea1a467a58d
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.127658488012868,
-  "global_step": 360000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4326,6 +4326,66 @@
       "learning_rate": 3.5428460769004264e-05,
       "loss": 0.3216,
       "step": 360000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.212764146688113,
+  "global_step": 365000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 3.5428460769004264e-05,
       "loss": 0.3216,
       "step": 360000
+    },
+    {
+      "epoch": 6.14,
+      "learning_rate": 3.525911128741588e-05,
+      "loss": 0.3217,
+      "step": 360500
+    },
+    {
+      "epoch": 6.14,
+      "learning_rate": 3.5090203380336435e-05,
+      "loss": 0.3216,
+      "step": 361000
+    },
+    {
+      "epoch": 6.15,
+      "learning_rate": 3.4921738714818835e-05,
+      "loss": 0.3216,
+      "step": 361500
+    },
+    {
+      "epoch": 6.16,
+      "learning_rate": 3.4753718953541264e-05,
+      "loss": 0.3216,
+      "step": 362000
+    },
+    {
+      "epoch": 6.17,
+      "learning_rate": 3.458614575479098e-05,
+      "loss": 0.3216,
+      "step": 362500
+    },
+    {
+      "epoch": 6.18,
+      "learning_rate": 3.441902077244776e-05,
+      "loss": 0.3218,
+      "step": 363000
+    },
+    {
+      "epoch": 6.19,
+      "learning_rate": 3.425234565596775e-05,
+      "loss": 0.3216,
+      "step": 363500
+    },
+    {
+      "epoch": 6.2,
+      "learning_rate": 3.4086454045879215e-05,
+      "loss": 0.3217,
+      "step": 364000
+    },
+    {
+      "epoch": 6.2,
+      "learning_rate": 3.39206826837805e-05,
+      "loss": 0.3217,
+      "step": 364500
+    },
+    {
+      "epoch": 6.21,
+      "learning_rate": 3.37553661059407e-05,
+      "loss": 0.3218,
+      "step": 365000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7697a15ef9673439312fb036c35de00fc97c3f08924c4d9a382535bc3e9dd969
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:0696c7f5ae19cb889783a904f338158b48f61bac33c2488b7805a376c9387ff9
 size 201355195