Training in progress, step 360000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d042c59cec9ca6319f1ca8657c391cadbe8eaf315761cd5ec606d56584140104
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:f9bb647830011f1f0c4939bdfd58513ca8d1b6b369f0f905ba5d1b59dff0d694
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5910c0b7a5e3c2f441642ec1a686e8bce121bf28c3af5d75fbbee7b8f68a39ac
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:7697a15ef9673439312fb036c35de00fc97c3f08924c4d9a382535bc3e9dd969
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a465d634594bd5b75a75ce0e093beee314e33a86c1a32d96906e654f0ea9a508
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:aac6ab5786efe14d88a6dfd5c47656ff2718062b841d7abdc16c78094b2cc8d5
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e94c41f141245fd0d3bbd8b776ed1d0976602d4413ffd612c8dcabe5b1c16e6f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c94c7c084b365de19772f29fe1d2ffdd18e2bd3f744bc288dfa9981c05f383e
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c873818117e2135d49af52f5086c668cbc499f08ef0b384fe02105c63537571b
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:867e91d51677fc0001645b808eefef44c8c1a86f4c9210d1d3576b946cebac35
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4acf28e1513a3b98dee0692321b45a7d896bdca216498d541517368d3b26b3dd
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:434def7e802ff1b8a0587a049f8cb9ff64f00a3dc17caa9f58fe716c7c9ce5bd
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:20da87859e2f01ca5bc7bf7171a168a6f7cc2f65bff5aa6987200a210b4bf9c4
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1e4bec7cc11f69c6b820a428063a4e9aab696285a5c1947c10e8d9e21010fca
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:689aa3ecff916ec13d78803edfe4eac5ec6a646077f09c3d2c42649c530616f5
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:74433998881e570fe5797566e28e4a779b8ade1b81209fbf1fa056d46d071355
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.042552829337622,
-  "global_step": 355000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4266,6 +4266,66 @@
       "learning_rate": 3.7145176802452735e-05,
       "loss": 0.3223,
       "step": 355000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.127658488012868,
+  "global_step": 360000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 3.7145176802452735e-05,
       "loss": 0.3223,
       "step": 355000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 3.697150590953425e-05,
+      "loss": 0.322,
+      "step": 355500
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 3.679860575795753e-05,
+      "loss": 0.3219,
+      "step": 356000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 3.6625785068168896e-05,
+      "loss": 0.3218,
+      "step": 356500
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.645339246437073e-05,
+      "loss": 0.3218,
+      "step": 357000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.6281429648008496e-05,
+      "loss": 0.3216,
+      "step": 357500
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.610989831628571e-05,
+      "loss": 0.322,
+      "step": 358000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 3.593880016214741e-05,
+      "loss": 0.3217,
+      "step": 358500
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 3.576813687426327e-05,
+      "loss": 0.3218,
+      "step": 359000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 3.5598250153690636e-05,
+      "loss": 0.3217,
+      "step": 359500
+    },
+    {
+      "epoch": 6.13,
+      "learning_rate": 3.5428460769004264e-05,
+      "loss": 0.3216,
+      "step": 360000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5910c0b7a5e3c2f441642ec1a686e8bce121bf28c3af5d75fbbee7b8f68a39ac
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:7697a15ef9673439312fb036c35de00fc97c3f08924c4d9a382535bc3e9dd969
 size 201355195