Training in progress, step 686663

Files changed (12) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:255d6608627f971b8fa635085e93d9d3736f8faf0307ad98fb42f9842388fe0c
 size 3871544599

 version https://git-lfs.github.com/spec/v1
+oid sha256:a3d505118400b8cc65706219c91d9a0c9e09d95df989221176ade7baf15c1bf7
 size 3871544599

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:042ed029d1ce0685e441b0e9e314fc5bd4a51055225e920c4b72a45accbce0e9
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:b28648855c1812b7c942932e21b3ab1aa9e737a8856b0498e44d5ff6bedae3d3
 size 1944201353

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d0daeb78ed36ddd95353d06116a1c5b99b401a3e3997b8ad9fd1e4f42aebb06c
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:98df663c0d2c6f550aa483476e744f6f0c8c0b14d26daa27cccf7752a403e539
 size 14575

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf6fe63eebe17142846ff03c21c0294f2edc6e808c40e3289c2aaf11354b4e1b
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:4fb55d22d3c41a6606c4cb3a01f7dfc8dfeeba6f924d365fc5dc46ec19e16d88
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:172037b6cd95ec064dde60c2c3ba541c435c94ffb5fdeac7374e280358af38c7
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:38b62db0464eeffe852cfb7f98cb9fdcf103e71f400d5cd41784ebdf1f318be2
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 17.940406412850866,
-  "global_step": 684391,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -8214,11 +8214,41 @@
       "learning_rate": 1.318388022380601e-07,
       "loss": 1.0081,
       "step": 684000
     }
   ],
   "max_steps": 686664,
   "num_train_epochs": 18,
-  "total_flos": 8.098705147455406e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 17.999963301213157,
+  "global_step": 686663,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.318388022380601e-07,
       "loss": 1.0081,
       "step": 684000
+    },
+    {
+      "epoch": 17.94,
+      "learning_rate": 1.541190384118929e-10,
+      "loss": 1.0351,
+      "step": 684500
+    },
+    {
+      "epoch": 17.96,
+      "learning_rate": 9.715872713339514e-11,
+      "loss": 1.0036,
+      "step": 685000
+    },
+    {
+      "epoch": 17.97,
+      "learning_rate": 5.3280415610590384e-11,
+      "loss": 1.0051,
+      "step": 685500
+    },
+    {
+      "epoch": 17.98,
+      "learning_rate": 2.2484333458694384e-11,
+      "loss": 1.0189,
+      "step": 686000
+    },
+    {
+      "epoch": 18.0,
+      "learning_rate": 4.770641833795608e-12,
+      "loss": 1.0073,
+      "step": 686500
     }
   ],
   "max_steps": 686664,
   "num_train_epochs": 18,
+  "total_flos": 8.123676033495859e+17,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57c294abd9c721e18601dcc394b69c2a686cae3c917a2515ad336aa7cda877f3
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:c66b8511c8447bf8cefed77f43d3065fb3525af0ff6bef8474faced4e32deedc
 size 3771

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:042ed029d1ce0685e441b0e9e314fc5bd4a51055225e920c4b72a45accbce0e9
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:b28648855c1812b7c942932e21b3ab1aa9e737a8856b0498e44d5ff6bedae3d3
 size 1944201353

runs/Jun10_17-24-57_2db923e410a0/events.out.tfevents.1686417954.2db923e410a0.29875.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c716808413cebb4ed416d22bee2d1c4a3835daca36424ca186b8680c3043a2cf
-size 4463

 version https://git-lfs.github.com/spec/v1
+oid sha256:4508ffec9e376014d67c3740755527327048d0bb90016e1e9197b96c17f37733
+size 5263

runs/Jun10_18-27-22_2db923e410a0/1686421718.1706398/events.out.tfevents.1686421718.2db923e410a0.45518.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6bbe3f8b84ebead3e3f4dd39ba3f4482fb6c0a4080888145ed00463168b58dc
+size 6187

runs/Jun10_18-27-22_2db923e410a0/events.out.tfevents.1686421718.2db923e410a0.45518.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6916063a7da02480eb2f0910d4a0ea9d71383a9733b4ba6ca49ca83f2b415759
+size 5265

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57c294abd9c721e18601dcc394b69c2a686cae3c917a2515ad336aa7cda877f3
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:c66b8511c8447bf8cefed77f43d3065fb3525af0ff6bef8474faced4e32deedc
 size 3771