Training in progress, step 200000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Feb25_19-21-23_t1v-n-eeadb94b-w-0/events.out.tfevents.1677352917.t1v-n-eeadb94b-w-0.615717.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:840c2c9b1e45544ffd0c8ea1d07aa03a513e11b46e48071199f0c1ef538931b8
 size 2693742553

 version https://git-lfs.github.com/spec/v1
+oid sha256:5b7d49319544a72931f7ee076c508b1a724907fad83b5a899a60bdac334a62f5
 size 2693742553

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:be2cc8073a1e189d84d176885c919af30b3b6d68cc715b0e75c9349edea091c7
 size 1346893675

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc050b6b6cea13715c082c4efde1df4eb7f489a44d07d86d55ddcf0803ea7d10
 size 1346893675

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04ad030a150fa0d8eb5e5920300951e9645dc85319159f9dd4f177aff4c5b722
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:be1ccf49f4804619cd7d22b74b595a694a368e629a10492b4089d6536d07bdf2
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.15,
-  "global_step": 150000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -930,11 +930,319 @@
       "eval_samples_per_second": 204.744,
       "eval_steps_per_second": 3.235,
       "step": 150000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 8.9474847473664e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2,
+  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 204.744,
       "eval_steps_per_second": 3.235,
       "step": 150000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.723691552302562e-05,
+      "loss": 1.0099,
+      "step": 151000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.718245238567939e-05,
+      "loss": 1.0822,
+      "step": 152000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.712747326859315e-05,
+      "loss": 1.0352,
+      "step": 153000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.707197877300974e-05,
+      "loss": 0.9671,
+      "step": 154000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.701596950580806e-05,
+      "loss": 1.0521,
+      "step": 155000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.695944607949649e-05,
+      "loss": 0.9215,
+      "step": 156000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.690240911220618e-05,
+      "loss": 0.9033,
+      "step": 157000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.684485922768422e-05,
+      "loss": 1.0112,
+      "step": 158000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.6786797055287e-05,
+      "loss": 0.843,
+      "step": 159000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.672822322997305e-05,
+      "loss": 0.9084,
+      "step": 160000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.66691383922964e-05,
+      "loss": 0.8648,
+      "step": 161000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.660954318839933e-05,
+      "loss": 0.7183,
+      "step": 162000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.654943827000548e-05,
+      "loss": 0.8846,
+      "step": 163000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.648882429441257e-05,
+      "loss": 0.8588,
+      "step": 164000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.642770192448536e-05,
+      "loss": 0.9902,
+      "step": 165000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.636607182864827e-05,
+      "loss": 0.937,
+      "step": 166000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.630393468087818e-05,
+      "loss": 0.9826,
+      "step": 167000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.624129116069694e-05,
+      "loss": 1.037,
+      "step": 168000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.617814195316411e-05,
+      "loss": 0.9159,
+      "step": 169000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.611448774886924e-05,
+      "loss": 0.9548,
+      "step": 170000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.605032924392457e-05,
+      "loss": 0.9936,
+      "step": 171000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.598566713995718e-05,
+      "loss": 1.0708,
+      "step": 172000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.59205021441015e-05,
+      "loss": 0.9153,
+      "step": 173000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.58548349689915e-05,
+      "loss": 0.9598,
+      "step": 174000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.578866633275288e-05,
+      "loss": 0.9642,
+      "step": 175000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.572199695899522e-05,
+      "loss": 0.8771,
+      "step": 176000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.565482757680415e-05,
+      "loss": 0.9064,
+      "step": 177000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.558715892073323e-05,
+      "loss": 0.9757,
+      "step": 178000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.551899173079607e-05,
+      "loss": 0.9963,
+      "step": 179000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.545032675245813e-05,
+      "loss": 1.0155,
+      "step": 180000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.538116473662861e-05,
+      "loss": 0.9509,
+      "step": 181000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.531150643965223e-05,
+      "loss": 0.8333,
+      "step": 182000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.524135262330098e-05,
+      "loss": 0.9373,
+      "step": 183000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.517070405476575e-05,
+      "loss": 0.852,
+      "step": 184000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.509956150664796e-05,
+      "loss": 0.9335,
+      "step": 185000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.502792575695112e-05,
+      "loss": 0.9773,
+      "step": 186000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.49557975890723e-05,
+      "loss": 0.9384,
+      "step": 187000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.488317779179361e-05,
+      "loss": 0.9105,
+      "step": 188000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.481006715927351e-05,
+      "loss": 0.9118,
+      "step": 189000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.473646649103818e-05,
+      "loss": 0.9584,
+      "step": 190000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.46623765919727e-05,
+      "loss": 0.7601,
+      "step": 191000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.458779827231237e-05,
+      "loss": 0.7258,
+      "step": 192000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.451273234763371e-05,
+      "loss": 0.8387,
+      "step": 193000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.443717963884569e-05,
+      "loss": 1.1209,
+      "step": 194000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.43611409721806e-05,
+      "loss": 0.8961,
+      "step": 195000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.428461717918511e-05,
+      "loss": 0.8493,
+      "step": 196000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.420760909671118e-05,
+      "loss": 1.0333,
+      "step": 197000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.413011756690685e-05,
+      "loss": 0.928,
+      "step": 198000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.405214343720707e-05,
+      "loss": 0.9016,
+      "step": 199000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.397368756032445e-05,
+      "loss": 0.9039,
+      "step": 200000
+    },
+    {
+      "epoch": 0.2,
+      "eval_loss": 0.6195229291915894,
+      "eval_runtime": 24.1688,
+      "eval_samples_per_second": 206.878,
+      "eval_steps_per_second": 3.269,
+      "step": 200000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.19299796631552e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:be2cc8073a1e189d84d176885c919af30b3b6d68cc715b0e75c9349edea091c7
 size 1346893675

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc050b6b6cea13715c082c4efde1df4eb7f489a44d07d86d55ddcf0803ea7d10
 size 1346893675

runs/Feb25_19-21-23_t1v-n-eeadb94b-w-0/events.out.tfevents.1677352917.t1v-n-eeadb94b-w-0.615717.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aefe1aebac0e8025c620d68dc1ecaa3d19209c3098ec73d83bd2140f5a1314f2
-size 20388

 version https://git-lfs.github.com/spec/v1
+oid sha256:2516320f139f5ebb64cdc6c31161aa5945f0ee016de07dcd90c6f7d4a8007155
+size 28664