Training in progress, step 570000

Files changed (11) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0da1ef405740ede16d7c81baf88ec88973e8fcbdb441ce52917b61f712d50fc0
 size 3871544599

 version https://git-lfs.github.com/spec/v1
+oid sha256:0d2f2d7d2cadbcd7aceb96a8defa15be9235cf2861e0762840aae2beea42ec13
 size 3871544599

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:30709e207b36718f536b16a253013a71842dd622a44ba8805bf0b4c0e036417e
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9b07757646176e92f8dcba8a0fbcd8bbbd32524a0ba9b8949cb9efe6972db82
 size 1944201353

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:99a96597fb2e1218053ef212278689f52ea58dd9e21b8f390d7cd19d045f98a5
-size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:682d8f5af9a928814c1aa2cae346952f943ae20f0591da8254fd1d084226fa01
+size 14511

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b50bf29af3be0d17d88e7de04f70adad4d116ed5c7e38513d419e8bfa3b773c3
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5970b634b76e24683de44b37ff55f568f86fe0760701f4b9ffa126dee06d439
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8a396b9aaa2353ce80b393afce7b647bf5bd3d6f87f372056aee44a65a4f72f
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:cc780bf13ad434a35e5ae2b895926fba6c88685df4820697e037e902660ebe70
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 14.863155466546434,
-  "global_step": 567000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -6810,11 +6810,47 @@
       "learning_rate": 7.72271099597614e-07,
       "loss": 1.0389,
       "step": 567000
     }
   ],
   "max_steps": 762960,
   "num_train_epochs": 20,
-  "total_flos": 6.80622136053203e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 14.941795724067065,
+  "global_step": 570000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 7.72271099597614e-07,
       "loss": 1.0389,
       "step": 567000
+    },
+    {
+      "epoch": 14.88,
+      "learning_rate": 7.685546472145017e-07,
+      "loss": 1.0438,
+      "step": 567500
+    },
+    {
+      "epoch": 14.89,
+      "learning_rate": 7.648603557785422e-07,
+      "loss": 1.0359,
+      "step": 568000
+    },
+    {
+      "epoch": 14.9,
+      "learning_rate": 7.6115856793579e-07,
+      "loss": 1.0527,
+      "step": 568500
+    },
+    {
+      "epoch": 14.92,
+      "learning_rate": 7.574715320461648e-07,
+      "loss": 1.034,
+      "step": 569000
+    },
+    {
+      "epoch": 14.93,
+      "learning_rate": 7.537844860442989e-07,
+      "loss": 1.0461,
+      "step": 569500
+    },
+    {
+      "epoch": 14.94,
+      "learning_rate": 7.50104841783765e-07,
+      "loss": 1.0558,
+      "step": 570000
     }
   ],
   "max_steps": 762960,
   "num_train_epochs": 20,
+  "total_flos": 6.839220162824847e+17,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db7f226016ec8dafc1c7095c0a76c7cf4c4a8a99df76a02ac45265015885b594
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:46b3a87459854f08d80f4fb8cbdd6dbf69afb36e65aeb8868750af0e1c3b25c3
 size 3771

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:30709e207b36718f536b16a253013a71842dd622a44ba8805bf0b4c0e036417e
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9b07757646176e92f8dcba8a0fbcd8bbbd32524a0ba9b8949cb9efe6972db82
 size 1944201353

runs/Jun01_02-00-15_72d6bfb1a401/1685586378.6154885/events.out.tfevents.1685586378.72d6bfb1a401.2268.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9551b3f358861a603b4ad3dd373c1de5b81224e41cd003794b30a06e5b1d93e3
+size 6184

runs/Jun01_02-00-15_72d6bfb1a401/events.out.tfevents.1685586378.72d6bfb1a401.2268.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:af84064e46c023b2e7c8f52a9f6ca52513f50bcd2868568b383555c16d38fda3
+size 5421

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db7f226016ec8dafc1c7095c0a76c7cf4c4a8a99df76a02ac45265015885b594
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:46b3a87459854f08d80f4fb8cbdd6dbf69afb36e65aeb8868750af0e1c3b25c3
 size 3771