Training in progress, step 187816

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +135 -3
pytorch_model.bin +1 -1
runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dab7c11e32bc742d74bdc97f13f6eba893be4230d872eaecd0689a72f1fc3083
 size 2401461637

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8dc1533667dc1e5d8754a77682404d92df2ed864b7d3231ea835c0fe8164152
 size 2401461637

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c2991727b803e8a0b02542f03f6557f0258a9e36d172bbf826844685e5c5185
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:e09b26a6cf4f4fcffcf0d3d40bd588e02142cf71d98c403f62ffa3a24a62fd35
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7fc5cf4ee407f42d02567591ae73b57604321015aed2152689ffa91a768c5cd
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:f7abbc3674fcc879cafecbf33145badc8ed83c64ea9c1dd9b26cb200ce8d10b4
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c9fc3a1a25e64cc5d7eeddd2fe8bdbd04e891f66624bb894c6a839cce384bc5
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:bede8f6a32f621408b9de8844a576e6a3d9ef01c46428875735af558fc7f135c
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.629615304513403,
-  "global_step": 176768,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2142,11 +2142,143 @@
       "learning_rate": 2.4958099035038134e-06,
       "loss": 2.7393,
       "step": 176500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
-  "total_flos": 2.0788079286996173e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.793966261045491,
+  "global_step": 187816,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.4958099035038134e-06,
       "loss": 2.7393,
       "step": 176500
+    },
+    {
+      "epoch": 2.63,
+      "learning_rate": 2.446222962720538e-06,
+      "loss": 2.7727,
+      "step": 177000
+    },
+    {
+      "epoch": 2.64,
+      "learning_rate": 2.396636021937263e-06,
+      "loss": 2.736,
+      "step": 177500
+    },
+    {
+      "epoch": 2.65,
+      "learning_rate": 2.3470490811539874e-06,
+      "loss": 2.7546,
+      "step": 178000
+    },
+    {
+      "epoch": 2.66,
+      "learning_rate": 2.297462140370712e-06,
+      "loss": 2.7601,
+      "step": 178500
+    },
+    {
+      "epoch": 2.66,
+      "learning_rate": 2.247875199587437e-06,
+      "loss": 2.7456,
+      "step": 179000
+    },
+    {
+      "epoch": 2.67,
+      "learning_rate": 2.1982882588041614e-06,
+      "loss": 2.76,
+      "step": 179500
+    },
+    {
+      "epoch": 2.68,
+      "learning_rate": 2.1487013180208863e-06,
+      "loss": 2.7396,
+      "step": 180000
+    },
+    {
+      "epoch": 2.69,
+      "learning_rate": 2.099114377237611e-06,
+      "loss": 2.761,
+      "step": 180500
+    },
+    {
+      "epoch": 2.69,
+      "learning_rate": 2.0495274364543354e-06,
+      "loss": 2.7603,
+      "step": 181000
+    },
+    {
+      "epoch": 2.7,
+      "learning_rate": 1.9999404956710603e-06,
+      "loss": 2.7614,
+      "step": 181500
+    },
+    {
+      "epoch": 2.71,
+      "learning_rate": 1.950353554887785e-06,
+      "loss": 2.7638,
+      "step": 182000
+    },
+    {
+      "epoch": 2.71,
+      "learning_rate": 1.9007666141045096e-06,
+      "loss": 2.7806,
+      "step": 182500
+    },
+    {
+      "epoch": 2.72,
+      "learning_rate": 1.8511796733212343e-06,
+      "loss": 2.7561,
+      "step": 183000
+    },
+    {
+      "epoch": 2.73,
+      "learning_rate": 1.801592732537959e-06,
+      "loss": 2.7473,
+      "step": 183500
+    },
+    {
+      "epoch": 2.74,
+      "learning_rate": 1.7520057917546838e-06,
+      "loss": 2.7405,
+      "step": 184000
+    },
+    {
+      "epoch": 2.74,
+      "learning_rate": 1.7024188509714083e-06,
+      "loss": 2.742,
+      "step": 184500
+    },
+    {
+      "epoch": 2.75,
+      "learning_rate": 1.652831910188133e-06,
+      "loss": 2.7387,
+      "step": 185000
+    },
+    {
+      "epoch": 2.76,
+      "learning_rate": 1.6032449694048577e-06,
+      "loss": 2.7681,
+      "step": 185500
+    },
+    {
+      "epoch": 2.77,
+      "learning_rate": 1.5536580286215825e-06,
+      "loss": 2.7599,
+      "step": 186000
+    },
+    {
+      "epoch": 2.77,
+      "learning_rate": 1.504071087838307e-06,
+      "loss": 2.7497,
+      "step": 186500
+    },
+    {
+      "epoch": 2.78,
+      "learning_rate": 1.4544841470550317e-06,
+      "loss": 2.7417,
+      "step": 187000
+    },
+    {
+      "epoch": 2.79,
+      "learning_rate": 1.4048972062717565e-06,
+      "loss": 2.739,
+      "step": 187500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
+  "total_flos": 2.2090056412387738e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c2991727b803e8a0b02542f03f6557f0258a9e36d172bbf826844685e5c5185
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:e09b26a6cf4f4fcffcf0d3d40bd588e02142cf71d98c403f62ffa3a24a62fd35
 size 1200739717

runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a5e4f0ed5da7d5706ba5011c8ef271d1d10c08c2a0dcb249dc605188bb19cec7
-size 61151

 version https://git-lfs.github.com/spec/v1
+oid sha256:1176956b862393d9e6e40ad4a6cb5dc97a6996dda8497059a0c5e1a17ea27e09
+size 64671