Training in progress, step 900000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:08f951759775273acca27a12ea950a11bbfb4e3e81edcf7e13a2e38e65ad7d75
 size 885325017

 version https://git-lfs.github.com/spec/v1
+oid sha256:afac54dc1a1a42c7a4035ae193ff5de66579579f043c436b6b866c47f6bba3d0
 size 885325017

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:164a1a0c14af3ddfe09b60b80146afabdba18c1085ddf41902e33cae32b815cd
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:b18a077575ed96947212d0f4c33b2f9fc7ee3cf38bd599c6885541f1875f03e7
 size 442675755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c1785c1e98ae2a8958f65f36a66254a4f1766d0da0b3fd343599a83dea6a88f
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:adedebe0cc7e07de957a9e2967d6e9c3934a9fdca3245f46a29d125e5e36192e
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:98fbf159ce1bb90afdab5d6ac994b4ab633fc21d8eb6c04c41c7f3a26253e5b5
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.11979,
-  "global_step": 850000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5242,11 +5242,319 @@
       "eval_samples_per_second": 485.791,
       "eval_steps_per_second": 3.886,
       "step": 850000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.4318651985195172e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.023748,
+  "global_step": 900000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 485.791,
       "eval_steps_per_second": 3.886,
       "step": 850000
+    },
+    {
+      "epoch": 5.12,
+      "learning_rate": 5.947856562792925e-06,
+      "loss": 0.6238,
+      "step": 851000
+    },
+    {
+      "epoch": 5.12,
+      "learning_rate": 5.869882433093155e-06,
+      "loss": 0.581,
+      "step": 852000
+    },
+    {
+      "epoch": 5.12,
+      "learning_rate": 5.79239090328883e-06,
+      "loss": 0.6045,
+      "step": 853000
+    },
+    {
+      "epoch": 5.12,
+      "learning_rate": 5.715382820814885e-06,
+      "loss": 0.7161,
+      "step": 854000
+    },
+    {
+      "epoch": 5.12,
+      "learning_rate": 5.6388590278194096e-06,
+      "loss": 0.6942,
+      "step": 855000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.562820361154314e-06,
+      "loss": 0.6408,
+      "step": 856000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.48726765236629e-06,
+      "loss": 0.5817,
+      "step": 857000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.412201727687644e-06,
+      "loss": 0.5988,
+      "step": 858000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.337623408027293e-06,
+      "loss": 0.6975,
+      "step": 859000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.263533508961827e-06,
+      "loss": 0.7198,
+      "step": 860000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.1899328407264855e-06,
+      "loss": 0.628,
+      "step": 861000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.116822208206396e-06,
+      "loss": 0.5893,
+      "step": 862000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 5.044202410927706e-06,
+      "loss": 0.5714,
+      "step": 863000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 4.972074243048897e-06,
+      "loss": 0.7271,
+      "step": 864000
+    },
+    {
+      "epoch": 5.13,
+      "learning_rate": 4.900438493352055e-06,
+      "loss": 0.7008,
+      "step": 865000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.829295945234258e-06,
+      "loss": 0.6306,
+      "step": 866000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.758647376699032e-06,
+      "loss": 0.5751,
+      "step": 867000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.688493560347773e-06,
+      "loss": 0.6041,
+      "step": 868000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.618835263371396e-06,
+      "loss": 0.7111,
+      "step": 869000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.549673247541875e-06,
+      "loss": 0.6979,
+      "step": 870000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.48100826920394e-06,
+      "loss": 0.6413,
+      "step": 871000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.412841079266777e-06,
+      "loss": 0.5835,
+      "step": 872000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.3451724231958644e-06,
+      "loss": 0.5934,
+      "step": 873000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.27800304100478e-06,
+      "loss": 0.6971,
+      "step": 874000
+    },
+    {
+      "epoch": 5.14,
+      "learning_rate": 4.2113336672471245e-06,
+      "loss": 0.7208,
+      "step": 875000
+    },
+    {
+      "epoch": 5.15,
+      "learning_rate": 4.145165031008508e-06,
+      "loss": 0.6318,
+      "step": 876000
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 4.079497855898501e-06,
+      "loss": 0.5358,
+      "step": 877000
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 4.01433286004283e-06,
+      "loss": 0.591,
+      "step": 878000
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 3.949670756075447e-06,
+      "loss": 0.627,
+      "step": 879000
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 3.885512251130763e-06,
+      "loss": 0.7322,
+      "step": 880000
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 3.821858046835913e-06,
+      "loss": 0.6815,
+      "step": 881000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.75870883930306e-06,
+      "loss": 0.6143,
+      "step": 882000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.696065319121833e-06,
+      "loss": 0.5698,
+      "step": 883000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.6339281713517303e-06,
+      "loss": 0.6294,
+      "step": 884000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.5722980755146517e-06,
+      "loss": 0.7191,
+      "step": 885000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.511175705587433e-06,
+      "loss": 0.7099,
+      "step": 886000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.4505617299945336e-06,
+      "loss": 0.6008,
+      "step": 887000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.390456811600673e-06,
+      "loss": 0.5644,
+      "step": 888000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.3308616077036115e-06,
+      "loss": 0.6293,
+      "step": 889000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.271776770026963e-06,
+      "loss": 0.7273,
+      "step": 890000
+    },
+    {
+      "epoch": 6.01,
+      "learning_rate": 3.213202944713023e-06,
+      "loss": 0.703,
+      "step": 891000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 3.155140772315773e-06,
+      "loss": 0.5858,
+      "step": 892000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 3.0975908877938277e-06,
+      "loss": 0.5898,
+      "step": 893000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 3.040553920503503e-06,
+      "loss": 0.6193,
+      "step": 894000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.9840304941919415e-06,
+      "loss": 0.7289,
+      "step": 895000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.928021226990263e-06,
+      "loss": 0.6799,
+      "step": 896000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.8725267314068495e-06,
+      "loss": 0.619,
+      "step": 897000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.817547614320615e-06,
+      "loss": 0.5712,
+      "step": 898000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.7630844769743757e-06,
+      "loss": 0.627,
+      "step": 899000
+    },
+    {
+      "epoch": 6.02,
+      "learning_rate": 2.7091379149682685e-06,
+      "loss": 0.7135,
+      "step": 900000
+    },
+    {
+      "epoch": 6.02,
+      "eval_loss": 0.4734259843826294,
+      "eval_runtime": 10.2687,
+      "eval_samples_per_second": 486.916,
+      "eval_steps_per_second": 3.895,
+      "step": 900000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.5160934549535326e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:164a1a0c14af3ddfe09b60b80146afabdba18c1085ddf41902e33cae32b815cd
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:b18a077575ed96947212d0f4c33b2f9fc7ee3cf38bd599c6885541f1875f03e7
 size 442675755

runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e52cdc8630d544095f08a1e0936e12cfe05b25bfc9effb63eb623b39cfd3cf76
-size 144425

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d0fda069269738addd33509653420dedbaca74c953cfcb302afb1d12b7a3b42
+size 152701