Training in progress, step 192, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd22194ae981192953c10bd8c7d7c229d363fe3051c02792c9530080c309db2d
 size 3380768360

 version https://git-lfs.github.com/spec/v1
+oid sha256:87f6f5e2ebebe7cbd36c7fc47902b762d5204ac5267047a39ffe3bae1f31820b
 size 3380768360

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dd7667b7685377e93cb674f532d76551a3a23b1d3a5e2dd6690c6cc456e5c3b4
 size 1757899449

 version https://git-lfs.github.com/spec/v1
+oid sha256:e3c5065690d7c3ac23c095dccfa8c8f644a2710e0edbe735a2a8dc943a9da737
 size 1757899449

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce07496a37a4ed6b1a548b1e73eeccecc1cf6f60eafddb58dcb81201d88a83bc
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:378cb8caa1753a27e13f72b6f9313442152b34dacda281ba328c9e010c1b29ab
 size 1465

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.8780487804878048,
   "eval_steps": 30,
-  "global_step": 180,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -315,6 +315,20 @@
       "eval_samples_per_second": 0.291,
       "eval_steps_per_second": 0.073,
       "step": 180
     }
   ],
   "logging_steps": 5,
@@ -329,12 +343,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 1.1783682305701724e+18,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.0,
   "eval_steps": 30,
+  "global_step": 192,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 0.291,
       "eval_steps_per_second": 0.073,
       "step": 180
+    },
+    {
+      "epoch": 1.9303135888501743,
+      "grad_norm": 0.10959440469741821,
+      "learning_rate": 4.55756592088058e-07,
+      "loss": 0.2618,
+      "step": 185
+    },
+    {
+      "epoch": 1.9825783972125435,
+      "grad_norm": 0.07039328664541245,
+      "learning_rate": 6.417464144736208e-08,
+      "loss": 0.2559,
+      "step": 190
     }
   ],
   "logging_steps": 5,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.2340088273817969e+18,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null