Training in progress, step 315000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:11ba1af3ca07f05b59a0f9d045b8502a890e39d6d713b1a68a79774487c538c4
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:986fd930859453f0bbb0a52eeb57549a8b1316f1d1780247ecfbfe0f9a13119a
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33044061cdae69282e0841e3fa8fb5cc7bb7ba2c335ee94c43ec527fde5de60a
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:6eaf07203b519520199a41cc0c67ab543d94d3933f85b837c948f43b77677714
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d9e955485a8b6c2204c1cd05e7146bc3d8d4aea199220bdeb0763bf9b3fe4990
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:24be0beac655ccefbd3a84f5d3c8a9b96e97783841928199a33ad24a6531cc6e
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a40eb8bd77540d5f51aa2626d7dc28a426fa540c25aaff397ab33d9c2cfc9ca6
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d9256796205b256efab4335c109c6da5a97f9254e1c45b4078531f232bcc477d
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aedd0ee2fba46776b8e9a3d54ff8ed40a6879de49804fa15d3dcd9b89d1ec8a0
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4f5cd324a541d3750857dce2626abd84585cc9b30b3c32ed627ee4167a9d0ba
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bbedddb259fec8d39a25799576be00b42005bed9171320d734f89be1d9f42f86
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ab7c0f0bc621de2c5e939fcd33f672573ad2f2ec8475c89ffb269bf1acc13d9
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:513b23ca2b61699867f7e4f0e83f6e0bf3f9836045ea9437165be2c511401531
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:dfae2ab72f777b3d01d09d07dc27793ce81bf079fbb253f8b977c5c09b6be3aa
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1db0c9d6f53ee9862fd806add4b35c4edb1edf9c5abd3a62a1824f925a04677b
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:b2d58cc217d81f79958e9cab10c1ba79a5a9ada49617d3342ddc9e114493bf73
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.276593390694547,
-  "global_step": 310000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3726,6 +3726,66 @@
       "learning_rate": 5.428158826048664e-05,
       "loss": 0.3249,
       "step": 310000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.3616990493697925,
+  "global_step": 315000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 5.428158826048664e-05,
       "loss": 0.3249,
       "step": 310000
+    },
+    {
+      "epoch": 5.29,
+      "learning_rate": 5.407718448027968e-05,
+      "loss": 0.3248,
+      "step": 310500
+    },
+    {
+      "epoch": 5.29,
+      "learning_rate": 5.387303654779643e-05,
+      "loss": 0.3245,
+      "step": 311000
+    },
+    {
+      "epoch": 5.3,
+      "learning_rate": 5.3669146477894576e-05,
+      "loss": 0.3245,
+      "step": 311500
+    },
+    {
+      "epoch": 5.31,
+      "learning_rate": 5.3465516282886794e-05,
+      "loss": 0.3245,
+      "step": 312000
+    },
+    {
+      "epoch": 5.32,
+      "learning_rate": 5.32621479725209e-05,
+      "loss": 0.3245,
+      "step": 312500
+    },
+    {
+      "epoch": 5.33,
+      "learning_rate": 5.305904355396001e-05,
+      "loss": 0.3244,
+      "step": 313000
+    },
+    {
+      "epoch": 5.34,
+      "learning_rate": 5.285620503176271e-05,
+      "loss": 0.3243,
+      "step": 313500
+    },
+    {
+      "epoch": 5.34,
+      "learning_rate": 5.265363440786338e-05,
+      "loss": 0.3244,
+      "step": 314000
+    },
+    {
+      "epoch": 5.35,
+      "learning_rate": 5.2451333681552255e-05,
+      "loss": 0.3241,
+      "step": 314500
+    },
+    {
+      "epoch": 5.36,
+      "learning_rate": 5.2249304849455853e-05,
+      "loss": 0.3243,
+      "step": 315000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33044061cdae69282e0841e3fa8fb5cc7bb7ba2c335ee94c43ec527fde5de60a
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:6eaf07203b519520199a41cc0c67ab543d94d3933f85b837c948f43b77677714
 size 201355195