Training in progress, step 45, checkpoint

Files changed (4) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e7627d883c62daaa26528ac5de1db758728ffc0e798698cf9dc09e67f3713bd
 size 4628218

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ba4e6f31201d085ea85e641dee81f15497cbec2c4bf4ac956f4b70c6557a22c
 size 4628218

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aeeb1d37c35dddc3499dfa65807e0f1e540a8c757e9ef0700cce98a54ce426b7
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:3cf420d826a76ebf3d18a2641574c572d67f70da8adcccd5dcab567f4430e22d
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9573e9d18ad7803441c819253e1705231d5811c0e4f29747c0574440f588f00
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:b665a2618254d0693455029a117143eb612684fd8f287fa7207d501afc785521
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.06524694154961486,
   "eval_steps": 9,
-  "global_step": 36,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -96,6 +96,28 @@
       "eval_samples_per_second": 285.366,
       "eval_steps_per_second": 35.78,
       "step": 36
     }
   ],
   "logging_steps": 5,
@@ -115,7 +137,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 647134130995200.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.08155867693701857,
   "eval_steps": 9,
+  "global_step": 45,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 285.366,
       "eval_steps_per_second": 35.78,
       "step": 36
+    },
+    {
+      "epoch": 0.07249660172179428,
+      "grad_norm": NaN,
+      "learning_rate": 0.00012803300858899104,
+      "loss": 0.0,
+      "step": 40
+    },
+    {
+      "epoch": 0.08155867693701857,
+      "grad_norm": NaN,
+      "learning_rate": 0.00011666776747647015,
+      "loss": 0.0,
+      "step": 45
+    },
+    {
+      "epoch": 0.08155867693701857,
+      "eval_loss": NaN,
+      "eval_runtime": 6.8846,
+      "eval_samples_per_second": 284.982,
+      "eval_steps_per_second": 35.732,
+      "step": 45
     }
   ],
   "logging_steps": 5,
       "attributes": {}
     }
   },
+  "total_flos": 808917663744000.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null