Training in progress, step 1000000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:69c2a3f0d71cdb35d08c4188dc0759de44bd72d54dd0e64ce39a1cc599afb440
 size 885325017

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6709c31ff0729a1d7c432a7387ac7045f87daa988613a212726f338bc80a9f5
 size 885325017

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c65138ee8a8889f23fd090f031b33c3c7187319b021a3e7673c53dffc8e14f9e
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:92b18fe4bb5da26c52d0fd64a7e1283a9392787bf8fa2100118119861935f53c
 size 442675755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a3146b2cf60fe575602b3dab14d07f2e3b1c9322dc666bc5e2455f1aba9e69d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c696e3facd4608b3fc117b6b37f55cf9f2b0bc62746ffe7180114a3b5d128e
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc2c2c8416f63b11e9c82d6dac05baa6ad73177ac658621e099b23ff71f2f801
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:906bc3ed48818cc1785b6a98c1e064532a322520b99cdf458cfd827674d9b7ec
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.073748,
-  "global_step": 950000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5858,11 +5858,319 @@
       "eval_samples_per_second": 447.176,
       "eval_steps_per_second": 3.577,
       "step": 950000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.6003204479826526e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.123748,
+  "global_step": 1000000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 447.176,
       "eval_steps_per_second": 3.577,
       "step": 950000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 6.549893279788277e-07,
+      "loss": 0.6979,
+      "step": 951000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 6.285834552247128e-07,
+      "loss": 0.6093,
+      "step": 952000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 6.027175003719354e-07,
+      "loss": 0.5832,
+      "step": 953000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 5.773917462864264e-07,
+      "loss": 0.6034,
+      "step": 954000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 5.526064699265753e-07,
+      "loss": 0.7171,
+      "step": 955000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 5.283619423401998e-07,
+      "loss": 0.6829,
+      "step": 956000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 5.046584286615697e-07,
+      "loss": 0.6362,
+      "step": 957000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 4.814961881085045e-07,
+      "loss": 0.5757,
+      "step": 958000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 4.5887547397955864e-07,
+      "loss": 0.6047,
+      "step": 959000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 4.367965336512403e-07,
+      "loss": 0.6948,
+      "step": 960000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 4.1525960857530243e-07,
+      "loss": 0.7152,
+      "step": 961000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.9426493427611177e-07,
+      "loss": 0.6197,
+      "step": 962000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.738127403480507e-07,
+      "loss": 0.5809,
+      "step": 963000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.5390325045304706e-07,
+      "loss": 0.5836,
+      "step": 964000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.3453668231809286e-07,
+      "loss": 0.7279,
+      "step": 965000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.157132477328628e-07,
+      "loss": 0.6954,
+      "step": 966000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.9743315254743833e-07,
+      "loss": 0.6144,
+      "step": 967000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.796965966699927e-07,
+      "loss": 0.5801,
+      "step": 968000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.625037740646763e-07,
+      "loss": 0.6001,
+      "step": 969000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.458548727494292e-07,
+      "loss": 0.7176,
+      "step": 970000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.2975007479397738e-07,
+      "loss": 0.6872,
+      "step": 971000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 2.1418955631781202e-07,
+      "loss": 0.6369,
+      "step": 972000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.9917348748826335e-07,
+      "loss": 0.5778,
+      "step": 973000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.847020325186577e-07,
+      "loss": 0.599,
+      "step": 974000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.7077534966650766e-07,
+      "loss": 0.6961,
+      "step": 975000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.5739359123178587e-07,
+      "loss": 0.7163,
+      "step": 976000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.4455690355525964e-07,
+      "loss": 0.6199,
+      "step": 977000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.3226542701689215e-07,
+      "loss": 0.5833,
+      "step": 978000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.2051929603428825e-07,
+      "loss": 0.5774,
+      "step": 979000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 1.0931863906127327e-07,
+      "loss": 0.7263,
+      "step": 980000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 9.866357858642205e-08,
+      "loss": 0.6966,
+      "step": 981000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 8.855423113177664e-08,
+      "loss": 0.6213,
+      "step": 982000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 7.899070725153613e-08,
+      "loss": 0.579,
+      "step": 983000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 6.997311153086883e-08,
+      "loss": 0.6005,
+      "step": 984000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 6.150154258476315e-08,
+      "loss": 0.7129,
+      "step": 985000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 5.3576093056922906e-08,
+      "loss": 0.6897,
+      "step": 986000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 4.619684961881254e-08,
+      "loss": 0.6395,
+      "step": 987000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 3.936389296864129e-08,
+      "loss": 0.5797,
+      "step": 988000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 3.3077297830541584e-08,
+      "loss": 0.5937,
+      "step": 989000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 2.7337132953697554e-08,
+      "loss": 0.6948,
+      "step": 990000
+    },
+    {
+      "epoch": 6.11,
+      "learning_rate": 2.214346111164556e-08,
+      "loss": 0.7171,
+      "step": 991000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 1.749633910153592e-08,
+      "loss": 0.6254,
+      "step": 992000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 1.3395817743561134e-08,
+      "loss": 0.5856,
+      "step": 993000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 9.841941880361916e-09,
+      "loss": 0.5713,
+      "step": 994000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 6.834750376549792e-09,
+      "loss": 0.7225,
+      "step": 995000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 4.3742761183018784e-09,
+      "loss": 0.6983,
+      "step": 996000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 2.4605460129556445e-09,
+      "loss": 0.626,
+      "step": 997000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 1.0935809887702154e-09,
+      "loss": 0.5772,
+      "step": 998000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 2.7339599464326627e-10,
+      "loss": 0.598,
+      "step": 999000
+    },
+    {
+      "epoch": 6.12,
+      "learning_rate": 0.0,
+      "loss": 0.7085,
+      "step": 1000000
+    },
+    {
+      "epoch": 6.12,
+      "eval_loss": 0.47990772128105164,
+      "eval_runtime": 10.5537,
+      "eval_samples_per_second": 473.766,
+      "eval_steps_per_second": 3.79,
+      "step": 1000000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.6845474410117726e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c65138ee8a8889f23fd090f031b33c3c7187319b021a3e7673c53dffc8e14f9e
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:92b18fe4bb5da26c52d0fd64a7e1283a9392787bf8fa2100118119861935f53c
 size 442675755

runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3416fba1663bed0ceb7da268696a6250ba565b786001d9ed7fe5a803fca0224a
-size 160977

 version https://git-lfs.github.com/spec/v1
+oid sha256:00318c70372e189e574b61ad78972e58f0a1a6d389587262a37adad04212402a
+size 169253