Training in progress, step 165720

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +135 -3
pytorch_model.bin +1 -1
runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dbacc42ae86d5bffee4563dcf70c2766a33a090badbf37473eee0b4563f66aed
 size 2401461637

 version https://git-lfs.github.com/spec/v1
+oid sha256:d74fdb539d44a35348b6810c0d848c4bf56592bd5cf768ed81575f1ebb8bcb14
 size 2401461637

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2804f7e0374fafd6bfaa3af3801b588460f7b01602d1c491a4b6f5e46a186dd5
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:2a5ec2ac5d923b5dd8a99ca581137ee6c85b4ea12bee1568d23a8455d2a58084
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cfde35a2a20f39b9f60c7d190042c042b4211d2fd0cd8241aad27a0edea70786
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:510fc81178791ae60890b99ad1e29739b0a1957018583076b8ffe9ee3580c1d3
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e6a3d083bf875c101097c911b12ddc02254be04dcf3f96b9e69fe4a1f81739c9
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d8dac73ce104ca44387089f603547c06c75d1a306882323278557a38f3d277f
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.300913391449228,
-  "global_step": 154672,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1878,11 +1878,143 @@
       "learning_rate": 4.677635297967928e-06,
       "loss": 2.7807,
       "step": 154500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
-  "total_flos": 1.8189972538166477e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.4652643479813157,
+  "global_step": 165720,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 4.677635297967928e-06,
       "loss": 2.7807,
       "step": 154500
+    },
+    {
+      "epoch": 2.31,
+      "learning_rate": 4.628048357184653e-06,
+      "loss": 2.7652,
+      "step": 155000
+    },
+    {
+      "epoch": 2.31,
+      "learning_rate": 4.578461416401377e-06,
+      "loss": 2.7918,
+      "step": 155500
+    },
+    {
+      "epoch": 2.32,
+      "learning_rate": 4.528874475618102e-06,
+      "loss": 2.7771,
+      "step": 156000
+    },
+    {
+      "epoch": 2.33,
+      "learning_rate": 4.479287534834827e-06,
+      "loss": 2.7561,
+      "step": 156500
+    },
+    {
+      "epoch": 2.34,
+      "learning_rate": 4.429700594051551e-06,
+      "loss": 2.7789,
+      "step": 157000
+    },
+    {
+      "epoch": 2.34,
+      "learning_rate": 4.380113653268276e-06,
+      "loss": 2.7629,
+      "step": 157500
+    },
+    {
+      "epoch": 2.35,
+      "learning_rate": 4.330526712485001e-06,
+      "loss": 2.7672,
+      "step": 158000
+    },
+    {
+      "epoch": 2.36,
+      "learning_rate": 4.280939771701725e-06,
+      "loss": 2.7643,
+      "step": 158500
+    },
+    {
+      "epoch": 2.37,
+      "learning_rate": 4.23135283091845e-06,
+      "loss": 2.7836,
+      "step": 159000
+    },
+    {
+      "epoch": 2.37,
+      "learning_rate": 4.181765890135175e-06,
+      "loss": 2.7742,
+      "step": 159500
+    },
+    {
+      "epoch": 2.38,
+      "learning_rate": 4.132178949351899e-06,
+      "loss": 2.7504,
+      "step": 160000
+    },
+    {
+      "epoch": 2.39,
+      "learning_rate": 4.082592008568624e-06,
+      "loss": 2.7738,
+      "step": 160500
+    },
+    {
+      "epoch": 2.4,
+      "learning_rate": 4.033005067785349e-06,
+      "loss": 2.7741,
+      "step": 161000
+    },
+    {
+      "epoch": 2.4,
+      "learning_rate": 3.983418127002074e-06,
+      "loss": 2.768,
+      "step": 161500
+    },
+    {
+      "epoch": 2.41,
+      "learning_rate": 3.933831186218798e-06,
+      "loss": 2.7874,
+      "step": 162000
+    },
+    {
+      "epoch": 2.42,
+      "learning_rate": 3.884244245435523e-06,
+      "loss": 2.7733,
+      "step": 162500
+    },
+    {
+      "epoch": 2.42,
+      "learning_rate": 3.834657304652248e-06,
+      "loss": 2.7677,
+      "step": 163000
+    },
+    {
+      "epoch": 2.43,
+      "learning_rate": 3.7850703638689717e-06,
+      "loss": 2.7601,
+      "step": 163500
+    },
+    {
+      "epoch": 2.44,
+      "learning_rate": 3.735483423085696e-06,
+      "loss": 2.7832,
+      "step": 164000
+    },
+    {
+      "epoch": 2.45,
+      "learning_rate": 3.685896482302421e-06,
+      "loss": 2.7704,
+      "step": 164500
+    },
+    {
+      "epoch": 2.45,
+      "learning_rate": 3.6363095415191457e-06,
+      "loss": 2.7698,
+      "step": 165000
+    },
+    {
+      "epoch": 2.46,
+      "learning_rate": 3.5867226007358706e-06,
+      "loss": 2.7724,
+      "step": 165500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
+  "total_flos": 1.9488674798095565e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2804f7e0374fafd6bfaa3af3801b588460f7b01602d1c491a4b6f5e46a186dd5
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:2a5ec2ac5d923b5dd8a99ca581137ee6c85b4ea12bee1568d23a8455d2a58084
 size 1200739717

runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:47793967c6dafaef3b95a29eec188cb0e4f8080e860f73f8f0392fb1553d09fe
-size 54111

 version https://git-lfs.github.com/spec/v1
+oid sha256:b7dd64fd5f5ee57511fff720cbb56340f4a2adf91133fae41a0df73cab017476
+size 57631