Training in progress, step 90000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e51fe3d77cc9e74a03015a679bf9c6e5b20948a91fec3a0a678f7ab3d632266b
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ec6dc111e6167617249a4034f667ff8c1dac4e0508b2d117f87c2a48b53f992
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c035316a6d8fc5afe7f4bf5263646f9d28003e5dc92f6d7d8ca0dfcd6793a547
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd1a954286945255af2c2f6a9caa52188dcc39909af1998372c65c068243f847
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:366fcf2af7e77643d8ba291b8a66dfb537d4ef759595fd9e7a945bd15b02507a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd75299155a785e038cc2034bc0ffae9f55e960c94bd0d7eeb1f0123fe91a7b9
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3ec4b721b64709a3029a0a2cb04e18d166896dfa34d7fdfc8143f8d8565fa60
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a9f62023cae76e82d48aee2a952f4c6d76c642cc4db4f90dd6af1d183efff25
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4fb92796b14e92fd63e400d0d94dcf933348fe7696852142cff135a6ac92eff3
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:6fb5901ddeb1cfbe18f3314a87d55dbe2efa71565718ac2ab36838d79b0ca129
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58ff7b8548b63f48264cef8154875e50044ff9178a1ba8dad705f9e679474825
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:143c38b79821877e7c44d516c39a7e7355c53315c2e2279c91582047957f2c7c
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:42b6574b57c2570000c9af4e77bbf53b450e6d4b62d98188361ee6a5f2aaa995
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:03c7bc8447e7ec329f5ebcdbdba23f6503dd9b1599722a7f3d541e97e65b905e
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:345b6e5a884c94f439eac86a159284d4991183aeed3398174ad1ad011c4a43d7
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:88745b2213b88b884ae47af09195b94e85097099ce2e5b5e82db98c713a418d9
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.446804708045038,
-  "global_step": 85000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1026,6 +1026,66 @@
       "learning_rate": 0.00014025955271103284,
       "loss": 0.3529,
       "step": 85000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.5319103667202834,
+  "global_step": 90000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00014025955271103284,
       "loss": 0.3529,
       "step": 85000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 0.00014014735191195807,
+      "loss": 0.3528,
+      "step": 85500
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 0.00014003478366336457,
+      "loss": 0.3527,
+      "step": 86000
+    },
+    {
+      "epoch": 1.47,
+      "learning_rate": 0.00013992253468820287,
+      "loss": 0.3559,
+      "step": 86500
+    },
+    {
+      "epoch": 1.48,
+      "learning_rate": 0.00013980856343455598,
+      "loss": 0.3566,
+      "step": 87000
+    },
+    {
+      "epoch": 1.49,
+      "learning_rate": 0.0001396940018945337,
+      "loss": 0.3554,
+      "step": 87500
+    },
+    {
+      "epoch": 1.5,
+      "learning_rate": 0.00013957885119881218,
+      "loss": 0.3552,
+      "step": 88000
+    },
+    {
+      "epoch": 1.51,
+      "learning_rate": 0.00013946311248388228,
+      "loss": 0.3548,
+      "step": 88500
+    },
+    {
+      "epoch": 1.51,
+      "learning_rate": 0.00013934678689203836,
+      "loss": 0.3547,
+      "step": 89000
+    },
+    {
+      "epoch": 1.52,
+      "learning_rate": 0.0001392298755713671,
+      "loss": 0.3547,
+      "step": 89500
+    },
+    {
+      "epoch": 1.53,
+      "learning_rate": 0.00013911237967573605,
+      "loss": 0.3541,
+      "step": 90000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c035316a6d8fc5afe7f4bf5263646f9d28003e5dc92f6d7d8ca0dfcd6793a547
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd1a954286945255af2c2f6a9caa52188dcc39909af1998372c65c068243f847
 size 201355195