Training in progress, step 630000

Files changed (11) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:30cd8050cb6404088c5716079148dd0da70144e4be8ff9a3d8b384acf70755c2
 size 3871544599

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e6d1b247617f454f8aba2d725b4b716e0e51b61999906e6bdb1b6bb40ec3856
 size 3871544599

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:05ee9a7da46e1a224189b23b0c2c4d8a9bfe97d804c74a078fe32f5d0875aad1
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:f825359cc32e06cdd2a780f075f408d8b0f23a0b1be16adda6020c3fee000f02
 size 1944201353

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:76cbb628e04923671f85d7d99e49cf45496fe34ffb57a5111e03658d124a7d16
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:15a1f862e56bea0c697db0f7c551b1c23f429cc092728541a372282c506543b9
 size 14575

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6143b27eaf96690bbe891751f24c600c4892dab7823d8c13fb59f1cc963b65c0
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:e7470e23b2c705976001439269366835bc44d2ce969c2d60f638dc1ef7d70370
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58e6a28fc1607a90c71dc0e11a421f4fc6f6121d48134da179bd1cba7f5481db
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:9dfdf862b25dade6b656c8ca945dace95c219bab8aa3565ea0e06857dfb4e22a
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 16.435971102326704,
-  "global_step": 627000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -7530,11 +7530,47 @@
       "learning_rate": 3.8297124131692177e-07,
       "loss": 1.0129,
       "step": 627000
     }
   ],
   "max_steps": 762960,
   "num_train_epochs": 20,
-  "total_flos": 7.466521265780244e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 16.514621845215004,
+  "global_step": 630000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 3.8297124131692177e-07,
       "loss": 1.0129,
       "step": 627000
+    },
+    {
+      "epoch": 16.45,
+      "learning_rate": 3.802380513016235e-07,
+      "loss": 1.0221,
+      "step": 627500
+    },
+    {
+      "epoch": 16.46,
+      "learning_rate": 3.775138463912581e-07,
+      "loss": 1.0119,
+      "step": 628000
+    },
+    {
+      "epoch": 16.48,
+      "learning_rate": 3.7479863813300294e-07,
+      "loss": 1.0212,
+      "step": 628500
+    },
+    {
+      "epoch": 16.49,
+      "learning_rate": 3.7209243803590006e-07,
+      "loss": 1.0243,
+      "step": 629000
+    },
+    {
+      "epoch": 16.5,
+      "learning_rate": 3.69395257570809e-07,
+      "loss": 1.025,
+      "step": 629500
+    },
+    {
+      "epoch": 16.51,
+      "learning_rate": 3.6671247544857765e-07,
+      "loss": 1.0369,
+      "step": 630000
     }
   ],
   "max_steps": 762960,
   "num_train_epochs": 20,
+  "total_flos": 7.499479244393595e+17,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5a7858cb286d248a8d1b95c7338f74eac69d03a9b32f71567312088ea225a92
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:a817e83c25ddaa8901cfc233f35e575b7ed2a8f04ee848f1df7a6ce2254ee042
 size 3771

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:05ee9a7da46e1a224189b23b0c2c4d8a9bfe97d804c74a078fe32f5d0875aad1
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:f825359cc32e06cdd2a780f075f408d8b0f23a0b1be16adda6020c3fee000f02
 size 1944201353

runs/Jun03_20-07-36_5814eb69ea9a/1685824428.675766/events.out.tfevents.1685824428.5814eb69ea9a.704.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a45957087d60ba82cebff2e1ba5034a47961917d8f0acd8b366e1c31721030cc
+size 6184

runs/Jun03_20-07-36_5814eb69ea9a/events.out.tfevents.1685824428.5814eb69ea9a.704.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7fa3c5c4fd8134e8f1b69a09e298c911d8d89cd9a0733740e8195019ea66202
+size 5421

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5a7858cb286d248a8d1b95c7338f74eac69d03a9b32f71567312088ea225a92
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:a817e83c25ddaa8901cfc233f35e575b7ed2a8f04ee848f1df7a6ce2254ee042
 size 3771