Training in progress, step 26, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc64c7aca36b556493920a1579db632d1384c45a36ac185dec3b8e1d4b492c78
 size 390888

 version https://git-lfs.github.com/spec/v1
+oid sha256:ca1040f95c6f7f116c38c2bf7eea8a30f200d211cbf352a6bad03b1af94fc0fa
 size 390888

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db8b85c338c34db5bcf64595492716fa17a71815ec97d9e7e13c35a583c7b157
 size 819770

 version https://git-lfs.github.com/spec/v1
+oid sha256:0fc2703554c63a96579e1a3220d5c9bfa89139b0a551397d9442451ce0bb0298
 size 819770

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d1702dcc0f9d9a8f9c63e74896356a19749f4963949bab512e43e702fe77962c
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:dff7474c416c2bfd55209bee67ee6bd1d6630537f2cf74fba6d21acac7fd83c4
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c0fc309d4608eca7c1f00c14befe35df8d98572a350ac190aaac790dc1a0befb
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5d17cc7d96fbe24ad40a731f4825abc56336860d89f3ac12726fee59c43123c
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8096385542168675,
   "eval_steps": 6,
-  "global_step": 21,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -53,6 +53,14 @@
       "learning_rate": 1.4644660940672627e-05,
       "loss": 8.7746,
       "step": 20
     }
   ],
   "logging_steps": 10,
@@ -67,12 +75,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 22027670913024.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.0313253012048194,
   "eval_steps": 6,
+  "global_step": 26,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.4644660940672627e-05,
       "loss": 8.7746,
       "step": 20
+    },
+    {
+      "epoch": 0.9253012048192771,
+      "eval_loss": 8.70206356048584,
+      "eval_runtime": 0.6614,
+      "eval_samples_per_second": 264.61,
+      "eval_steps_per_second": 33.265,
+      "step": 24
     }
   ],
   "logging_steps": 10,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 27272354463744.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null