Training in progress, step 250000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Dec30_08-05-16_t1v-n-4a21561c-w-0/events.out.tfevents.1672387541.t1v-n-4a21561c-w-0.14765.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ade1b0b7b3f843a27d19a5a7abf28523d1dd1f13694a0a01ed12d2dd44287a10
 size 885325017

 version https://git-lfs.github.com/spec/v1
+oid sha256:06e43a481aa09f133d4bdb1d744a60d7d242924db68aa84b2a04cdf8b3d8a95b
 size 885325017

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fedbde3e4ced89eb99252547c27e574617ab64d9efddc4f95381c1461433e515
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ef4eda0da8e2b25fadddf1ff76a7a4bef8f712fdd552bff59bb80a072360cc0
 size 442675755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31471c836416c0a11bf9f5d56b4929469fb07edd9fc2db01c46541cb396ecb6b
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:16ce1b7c1cb402e7a68141ff41519d1e3232f0eb41367c240aac2ab72667cdbd
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:be1ccf49f4804619cd7d22b74b595a694a368e629a10492b4089d6536d07bdf2
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:7924e9d3f9ed054868d3ddaa60025f26707d231e7eacc5684e8550acfee9e9c0
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.055709,
-  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1238,11 +1238,319 @@
       "eval_samples_per_second": 393.967,
       "eval_steps_per_second": 3.152,
       "step": 200000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 3.3690839325144515e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.105709,
+  "global_step": 250000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 393.967,
       "eval_steps_per_second": 3.152,
       "step": 200000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.389475079423988e-05,
+      "loss": 0.6848,
+      "step": 201000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.381533400219318e-05,
+      "loss": 0.6762,
+      "step": 202000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.373543805267368e-05,
+      "loss": 0.6713,
+      "step": 203000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.365506381941066e-05,
+      "loss": 0.6702,
+      "step": 204000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.357421218136386e-05,
+      "loss": 0.669,
+      "step": 205000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.349288402271388e-05,
+      "loss": 0.6691,
+      "step": 206000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.341108023285238e-05,
+      "loss": 0.6799,
+      "step": 207000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.332880170637252e-05,
+      "loss": 0.6795,
+      "step": 208000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 9.32460493430591e-05,
+      "loss": 0.6777,
+      "step": 209000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.316282404787871e-05,
+      "loss": 0.6798,
+      "step": 210000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.30791267309698e-05,
+      "loss": 0.6833,
+      "step": 211000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.299495830763286e-05,
+      "loss": 0.6728,
+      "step": 212000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.291031969832026e-05,
+      "loss": 0.6679,
+      "step": 213000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.282521182862629e-05,
+      "loss": 0.6658,
+      "step": 214000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.273963562927695e-05,
+      "loss": 0.6638,
+      "step": 215000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.265359203611987e-05,
+      "loss": 0.6661,
+      "step": 216000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.256708199011401e-05,
+      "loss": 0.6779,
+      "step": 217000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.248010643731935e-05,
+      "loss": 0.6775,
+      "step": 218000
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 9.239266632888659e-05,
+      "loss": 0.6746,
+      "step": 219000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.230476262104677e-05,
+      "loss": 0.6758,
+      "step": 220000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.221639627510076e-05,
+      "loss": 0.6801,
+      "step": 221000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.212756825740873e-05,
+      "loss": 0.6689,
+      "step": 222000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.20382795393797e-05,
+      "loss": 0.6653,
+      "step": 223000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.194853109746074e-05,
+      "loss": 0.6629,
+      "step": 224000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.185832391312644e-05,
+      "loss": 0.6632,
+      "step": 225000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.176765897286813e-05,
+      "loss": 0.6629,
+      "step": 226000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.167653726818305e-05,
+      "loss": 0.6735,
+      "step": 227000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.158495979556358e-05,
+      "loss": 0.6748,
+      "step": 228000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 9.14929275564863e-05,
+      "loss": 0.6708,
+      "step": 229000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.140044155740101e-05,
+      "loss": 0.6706,
+      "step": 230000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.130750280971978e-05,
+      "loss": 0.6768,
+      "step": 231000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.121411232980588e-05,
+      "loss": 0.664,
+      "step": 232000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.112027113896262e-05,
+      "loss": 0.6614,
+      "step": 233000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.102598026342222e-05,
+      "loss": 0.6577,
+      "step": 234000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.093124073433463e-05,
+      "loss": 0.659,
+      "step": 235000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.083605358775612e-05,
+      "loss": 0.6601,
+      "step": 236000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.074041986463808e-05,
+      "loss": 0.6667,
+      "step": 237000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.064434061081562e-05,
+      "loss": 0.6685,
+      "step": 238000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.0547816876996e-05,
+      "loss": 0.6658,
+      "step": 239000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 9.045084971874738e-05,
+      "loss": 0.6694,
+      "step": 240000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 9.035344019648702e-05,
+      "loss": 0.6737,
+      "step": 241000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 9.025558937546988e-05,
+      "loss": 0.6588,
+      "step": 242000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 9.015729832577681e-05,
+      "loss": 0.6577,
+      "step": 243000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 9.005856812230304e-05,
+      "loss": 0.6542,
+      "step": 244000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 8.995939984474624e-05,
+      "loss": 0.6518,
+      "step": 245000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 8.98597945775948e-05,
+      "loss": 0.6569,
+      "step": 246000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 8.975975341011596e-05,
+      "loss": 0.6675,
+      "step": 247000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 8.965927743634391e-05,
+      "loss": 0.6672,
+      "step": 248000
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 8.955836775506776e-05,
+      "loss": 0.6621,
+      "step": 249000
+    },
+    {
+      "epoch": 1.11,
+      "learning_rate": 8.945702546981969e-05,
+      "loss": 0.6677,
+      "step": 250000
+    },
+    {
+      "epoch": 1.11,
+      "eval_loss": 0.4477137625217438,
+      "eval_runtime": 11.1571,
+      "eval_samples_per_second": 448.145,
+      "eval_steps_per_second": 3.585,
+      "step": 250000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 4.2113538628056515e+18,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fedbde3e4ced89eb99252547c27e574617ab64d9efddc4f95381c1461433e515
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ef4eda0da8e2b25fadddf1ff76a7a4bef8f712fdd552bff59bb80a072360cc0
 size 442675755

runs/Dec30_08-05-16_t1v-n-4a21561c-w-0/events.out.tfevents.1672387541.t1v-n-4a21561c-w-0.14765.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9bf2675a56b0f10e10219ddf24c44b9932ac21c9ddb7616ff45b5c9a88efd55
-size 36837

 version https://git-lfs.github.com/spec/v1
+oid sha256:05d76e89d8ec1543565fc88bd7054e0b38b6d4bb0712febddeaef7d04bae07cb
+size 45113