Training in progress, step 2000, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c72cd05b8ea3c2eaa7ec017e827eb1dbbb06336a1c31f8fa34fea733fd8fc3a
 size 627606952

 version https://git-lfs.github.com/spec/v1
+oid sha256:d8b4c290a0473e3f1a83750a409562d823c6df4a1b7a59e78e869dd7ad4ff004
 size 627606952

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6959a3ea2e2996dcb0bd6ccfbbd34b3ebdc17ba9168d3fa8babea98152a16e4a
 size 318985924

 version https://git-lfs.github.com/spec/v1
+oid sha256:757014c53f19b73e429af204a5338d3f14676b7fc2c7966ce939c733cec084fc
 size 318985924

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1656123ea9f4ccfdf9d2d730280c78325111e6e9e5692bc2f84858ee1c8f00e
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:b579740f0f439f469c486c69eea58de2c5120d23d26733b64db7c7667df71a90
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:becb7369a7ca594132dccc05171d427b0764f614e10dbe1c111bf394e5b3745a
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:f58d40a7f8af25cfc5622dc7ce8236177ec2ab2d63460c9947df6c8985225e32
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73b3a96efb3ed4510e4a056e002c98eac78fbe0baf34c3b554604b6c4b3665ec
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f7c278c6bb8d46d099e72f39e89da9bd3a2bc727a0e97053dcb3adc0e3887f4
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e7a51362ccac796c62466a67fd20ccd2abff6705853e1c6dde4d4c505145c021
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:624bc06ceaa4f535ee5bd5523aba308ae079239fd1216a542ff7f206dfe9e0d6
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:05adf40980d62eeb6310d6e8a5a137807e65ef3da23b6284a62e802808e7d470
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:5846dae2a3f5d45e9c6a0d8735dbdf59f88cd724bb5390de8d74fdb0a3570143
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c29ef52520b125f2f9524ec7af2bc737c5ea23d503faa0f52aaebc0df2fdaf62
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:8fd362c0cdd2c0b07695c69ba21a13f79c1271c6cc1f095f8c8f3826affb6f2d
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1d8e4195a944b0da9dc268731bc5b37bebc575fbf0e4c5c6b8470dd31e47d38
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:bfadb0579f7e6f5845d871b6bdfc6bac7aa6c9d1a062b11d56ebfd5eb6cb6f5f
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ed45e876d63deb08b4fd5daf0982116d0a8020e63f4387ee514dc6ec947968b
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:665b232df28dd286682f25be6672af0fa77ccef4cdff53c9e9e9243286f09d8b
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2509ad1b6fee1de76d21593e4c061d648f7bbc1435b98bd242ae321a5780dc6f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff620fa731932bfad032c9b2869fcd08718601bc76c1b44cf37971591fc72fbd
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 99.5,
   "eval_steps": 20,
-  "global_step": 1990,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2200,6 +2200,21 @@
       "learning_rate": 1.2486132855826781e-08,
       "loss": 0.0002,
       "step": 1990
     }
   ],
   "logging_steps": 10,
@@ -2214,12 +2229,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 4.18398282448896e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 100.0,
   "eval_steps": 20,
+  "global_step": 2000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.2486132855826781e-08,
       "loss": 0.0002,
       "step": 1990
+    },
+    {
+      "epoch": 100.0,
+      "grad_norm": 0.0007593940244987607,
+      "learning_rate": 0.0,
+      "loss": 0.0002,
+      "step": 2000
+    },
+    {
+      "epoch": 100.0,
+      "eval_loss": 1.9426655769348145,
+      "eval_runtime": 0.396,
+      "eval_samples_per_second": 45.452,
+      "eval_steps_per_second": 7.575,
+      "step": 2000
     }
   ],
   "logging_steps": 10,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 4.205007863808e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null