Training in progress, step 135000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f690f84228c1cf7c536edbf2267bc0cdfd0f89ce3c54b91efac1cb60aa94cad0
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:928c3746f9382b349fc28e80d04b5a20158395105d5217c3005ba37255c3ca77
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ec2a9e31c576538f128ada4a29cf915346ae2568cbf6b58a244e46c6f147e84
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:5110cd9554e14b21510435e745dab095b01a66799fa13e3282560ca1e6c45499
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5eb0ca6b4aedddaec2485b3f9da640a30b0d0c4a6748d79ba9759fcf1059aafe
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d0b1514696acbea535d08573a1b2d3b31938bfb72bfeab4eb11f6d2373802be4
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee3ef0876874dbc2e513a558038a6c2a16a643066aa73749397a26d9e6da45a3
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:8499b7e9d1a8145db60bfc50cf0edd03d252ca1ec45abe3f044e258613563f47
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7d6c5f43829cf907e0e5f04a8918256c0a34c747002f9f1dcacccf8010756aff
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:61efa3d107ffd4c591af8bc6122fbe036d89c50d1c5b1e286246a90e3c68104b
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:393742d5819ac3df5ee9648fcf8701d7dbb1400b0807804e7126483e0b53ae3a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d5e1eec7327c005bf9146420cdca2e2d7329d76afea935314537cbb31fdce8bb
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1908f20d92a8293a342e348b5b074ab1cd3d720accabd7a844bf778768c4405
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ef237e3efe3b0130f216c0e5b4fc7b0739fb6103cc4ce8392328f95e9b9e2c6
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9cba00ab4119ca26f6b23d0c7741da241151231837b95816f094795ad39dadf1
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a2aef2a9ec660505c33a59d4501ad8e14372a86baef2bf2887bd89652ca5ea7
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.2127659574468086,
-  "global_step": 130000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1566,6 +1566,66 @@
       "learning_rate": 0.00012793432590746354,
       "loss": 0.3432,
       "step": 130000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.297872340425532,
+  "global_step": 135000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00012793432590746354,
       "loss": 0.3432,
       "step": 130000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 0.00012777382835231195,
+      "loss": 0.343,
+      "step": 130500
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 0.0001276128592887616,
+      "loss": 0.3429,
+      "step": 131000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 0.00012745174365140025,
+      "loss": 0.3427,
+      "step": 131500
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 0.00012728983727684876,
+      "loss": 0.3426,
+      "step": 132000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 0.00012712746417069506,
+      "loss": 0.3425,
+      "step": 132500
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 0.00012696462593549614,
+      "loss": 0.3426,
+      "step": 133000
+    },
+    {
+      "epoch": 2.27,
+      "learning_rate": 0.0001268013241783996,
+      "loss": 0.3421,
+      "step": 133500
+    },
+    {
+      "epoch": 2.28,
+      "learning_rate": 0.00012663756051112788,
+      "loss": 0.3421,
+      "step": 134000
+    },
+    {
+      "epoch": 2.29,
+      "learning_rate": 0.00012647333654996226,
+      "loss": 0.3419,
+      "step": 134500
+    },
+    {
+      "epoch": 2.3,
+      "learning_rate": 0.00012630898373767156,
+      "loss": 0.342,
+      "step": 135000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ec2a9e31c576538f128ada4a29cf915346ae2568cbf6b58a244e46c6f147e84
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:5110cd9554e14b21510435e745dab095b01a66799fa13e3282560ca1e6c45499
 size 201355195