Training in progress, step 198864

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +135 -3
pytorch_model.bin +1 -1
runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8dc1533667dc1e5d8754a77682404d92df2ed864b7d3231ea835c0fe8164152
 size 2401461637

 version https://git-lfs.github.com/spec/v1
+oid sha256:0cedde736261632f89acf33553d7f1b796fa4666797a76600bc7414afba87e83
 size 2401461637

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e09b26a6cf4f4fcffcf0d3d40bd588e02142cf71d98c403f62ffa3a24a62fd35
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c830ba03e87ef89c167a65183788768bf905dc7f4c689fe476c351a7fc9b93b
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7abbc3674fcc879cafecbf33145badc8ed83c64ea9c1dd9b26cb200ce8d10b4
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd594782425d26032039a6c2b147e5861095f1958bd2b0f4a2e42679340bff32
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bede8f6a32f621408b9de8844a576e6a3d9ef01c46428875735af558fc7f135c
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:e9febce275791009bb39a3242ecdd95ff1e50bc7a7886ff99da486505feed461
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.793966261045491,
-  "global_step": 187816,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2274,11 +2274,143 @@
       "learning_rate": 1.4048972062717565e-06,
       "loss": 2.739,
       "step": 187500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
-  "total_flos": 2.2090056412387738e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.9583172175775787,
+  "global_step": 198864,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.4048972062717565e-06,
       "loss": 2.739,
       "step": 187500
+    },
+    {
+      "epoch": 2.8,
+      "learning_rate": 1.3553102654884812e-06,
+      "loss": 2.7633,
+      "step": 188000
+    },
+    {
+      "epoch": 2.8,
+      "learning_rate": 1.3057233247052057e-06,
+      "loss": 2.7516,
+      "step": 188500
+    },
+    {
+      "epoch": 2.81,
+      "learning_rate": 1.2561363839219304e-06,
+      "loss": 2.7638,
+      "step": 189000
+    },
+    {
+      "epoch": 2.82,
+      "learning_rate": 1.2065494431386552e-06,
+      "loss": 2.7397,
+      "step": 189500
+    },
+    {
+      "epoch": 2.83,
+      "learning_rate": 1.1569625023553797e-06,
+      "loss": 2.7614,
+      "step": 190000
+    },
+    {
+      "epoch": 2.83,
+      "learning_rate": 1.1073755615721044e-06,
+      "loss": 2.7235,
+      "step": 190500
+    },
+    {
+      "epoch": 2.84,
+      "learning_rate": 1.0577886207888292e-06,
+      "loss": 2.7401,
+      "step": 191000
+    },
+    {
+      "epoch": 2.85,
+      "learning_rate": 1.0082016800055539e-06,
+      "loss": 2.7573,
+      "step": 191500
+    },
+    {
+      "epoch": 2.86,
+      "learning_rate": 9.586147392222784e-07,
+      "loss": 2.7452,
+      "step": 192000
+    },
+    {
+      "epoch": 2.86,
+      "learning_rate": 9.090277984390032e-07,
+      "loss": 2.7505,
+      "step": 192500
+    },
+    {
+      "epoch": 2.87,
+      "learning_rate": 8.594408576557279e-07,
+      "loss": 2.7233,
+      "step": 193000
+    },
+    {
+      "epoch": 2.88,
+      "learning_rate": 8.098539168724526e-07,
+      "loss": 2.7409,
+      "step": 193500
+    },
+    {
+      "epoch": 2.89,
+      "learning_rate": 7.602669760891772e-07,
+      "loss": 2.7424,
+      "step": 194000
+    },
+    {
+      "epoch": 2.89,
+      "learning_rate": 7.10680035305902e-07,
+      "loss": 2.7563,
+      "step": 194500
+    },
+    {
+      "epoch": 2.9,
+      "learning_rate": 6.610930945226266e-07,
+      "loss": 2.7478,
+      "step": 195000
+    },
+    {
+      "epoch": 2.91,
+      "learning_rate": 6.115061537393512e-07,
+      "loss": 2.7555,
+      "step": 195500
+    },
+    {
+      "epoch": 2.92,
+      "learning_rate": 5.619192129560759e-07,
+      "loss": 2.7679,
+      "step": 196000
+    },
+    {
+      "epoch": 2.92,
+      "learning_rate": 5.123322721728006e-07,
+      "loss": 2.7219,
+      "step": 196500
+    },
+    {
+      "epoch": 2.93,
+      "learning_rate": 4.6274533138952524e-07,
+      "loss": 2.7283,
+      "step": 197000
+    },
+    {
+      "epoch": 2.94,
+      "learning_rate": 4.131583906062499e-07,
+      "loss": 2.7703,
+      "step": 197500
+    },
+    {
+      "epoch": 2.95,
+      "learning_rate": 3.6357144982297465e-07,
+      "loss": 2.7606,
+      "step": 198000
+    },
+    {
+      "epoch": 2.95,
+      "learning_rate": 3.1398450903969933e-07,
+      "loss": 2.7247,
+      "step": 198500
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
+  "total_flos": 2.3390721608830157e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e09b26a6cf4f4fcffcf0d3d40bd588e02142cf71d98c403f62ffa3a24a62fd35
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c830ba03e87ef89c167a65183788768bf905dc7f4c689fe476c351a7fc9b93b
 size 1200739717

runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1176956b862393d9e6e40ad4a6cb5dc97a6996dda8497059a0c5e1a17ea27e09
-size 64671

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3418c4d48d9655d66cec7f231aa9eca5c7d2436ae748697c02e220abc2d1378
+size 68191