Training in progress, step 465000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61aa4e9f023152bed2aa596934d5e42f40b173f755150e912b6614c279f88f16
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:ae04b2af6665d3abd0a5d470b2bf7284897a4bb07c27eee0b6e1ba438decaa9e
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0041fa71647d2cd9df59d7b5cff88993534ca01fdffe6c97ebff4b6b443fd0e2
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:644ad84ef5090cb35e5912b8047809eda9520df938e75c6201875a5342c64fd2
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:224147acac4c428ab25416c74203a796fb9ba398217dbc0d6d069fb51d8ae70c
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:51c7096ef367fe08d551162878490b72e213ab4074868ce645c4d56dbd28b7f8
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:370b0b9e82367f81826a68fe4933489b6c24ac5c097045a65f60cebec12b46ac
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f6397a75202f41185a5c7f676904b0cdcfc1129c7b082fd80a7c71fec6249b58
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61a702dfc1727eb7e283876e0762ff2705652ffe9ef399715ec19d685d2566e2
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:fbddd6c4b5409d3e334436c44017507eac79522d187987e8599c405f1a9e9544
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0660e813a1c8e30d9dae8ca6064cf65b21ce2bac86463a2844ddbc8735ffeaee
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:5913a0c5a22066143a6562114115973db2da2530c508c25fc07b079b06992170
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66e9cea135a1b298a0410e4005fc8f12b63c8c5ab8a3f244d8fe801da116fbca
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:97d81d8dbecd2ea9e42e8620e48d4dcdb6bff10d69a3ce07912303dc15dd9ce5
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:583fe6059dd28557686d7204c7aab4790397f0b6c5f67be3ad8679928fd339be
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:762160864ae4cc7ba8ec08f333d74f30ba91d560ae0a08efd676fd1a9052fbd3
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.829780172083642,
-  "global_step": 460000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5526,6 +5526,66 @@
       "learning_rate": 1.2218580821636874e-05,
       "loss": 0.319,
       "step": 460000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 7.914885830758887,
+  "global_step": 465000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.2218580821636874e-05,
       "loss": 0.319,
       "step": 460000
+    },
+    {
+      "epoch": 7.84,
+      "learning_rate": 1.2163988785682091e-05,
+      "loss": 0.3187,
+      "step": 460500
+    },
+    {
+      "epoch": 7.85,
+      "learning_rate": 1.2110066263771492e-05,
+      "loss": 0.3188,
+      "step": 461000
+    },
+    {
+      "epoch": 7.86,
+      "learning_rate": 1.2056813788098594e-05,
+      "loss": 0.3188,
+      "step": 461500
+    },
+    {
+      "epoch": 7.86,
+      "learning_rate": 1.2004231884243836e-05,
+      "loss": 0.3188,
+      "step": 462000
+    },
+    {
+      "epoch": 7.87,
+      "learning_rate": 1.195242422270528e-05,
+      "loss": 0.3186,
+      "step": 462500
+    },
+    {
+      "epoch": 7.88,
+      "learning_rate": 1.1901285479547943e-05,
+      "loss": 0.3187,
+      "step": 463000
+    },
+    {
+      "epoch": 7.89,
+      "learning_rate": 1.1850715688988035e-05,
+      "loss": 0.3187,
+      "step": 463500
+    },
+    {
+      "epoch": 7.9,
+      "learning_rate": 1.1800818504351289e-05,
+      "loss": 0.3186,
+      "step": 464000
+    },
+    {
+      "epoch": 7.91,
+      "learning_rate": 1.175159441810279e-05,
+      "loss": 0.3187,
+      "step": 464500
+    },
+    {
+      "epoch": 7.91,
+      "learning_rate": 1.1703043916064376e-05,
+      "loss": 0.3188,
+      "step": 465000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0041fa71647d2cd9df59d7b5cff88993534ca01fdffe6c97ebff4b6b443fd0e2
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:644ad84ef5090cb35e5912b8047809eda9520df938e75c6201875a5342c64fd2
 size 201355195