Training in progress, step 10, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:009435752cba422c5e8cbaf14d90b8c439ea6b7fd0dc7358e968cc0a4b9122f3
 size 50503544

 version https://git-lfs.github.com/spec/v1
+oid sha256:550f93216f0b5f3fdf4bf2efe0f7225b795fc220a07384321b81741105d9e069
 size 50503544

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97081d766c1efd083986e7037f3441e71755761df25e179dc3334cdf6088b140
 size 25986148

 version https://git-lfs.github.com/spec/v1
+oid sha256:cbe3a8b2e24fdc50dfe38d273f9deaf75d4da9a207f66628d6a977773660e828
 size 25986148

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f50d1f2a647ab66bf93520813e13396221f342eeb0033fac7d886683239dbca
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:22ff52b36e238ec8c5e0ae77ac3a583321bf95dd765824a123fa18ceebc689e0
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8066cf8d591755892e9112cdbf2b6cedcdc6a2248abd6ea2145bf28de0d8d85f
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:5b4c9435b0b42cc713eea6ce123a4d1aaa03f4cdaabf4128ab6be48043d8bc62
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ecffe7252c8c9baeec2930898096ca83078383402ee33b5b0186d53d3b0ca53
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff2e2aa09dba491989d2e653b5122858cda9732d0dc8bda6aad86d87f1fcf803
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4612ac416d87f114d4517611323e4353adc5c12edfd9a825bfd49510f2c555e7
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab66a9e238747970935c296838109efc33d576c0992707e87ca257f11ab75f6e
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:87a58c8092333296a66f332b13e3b0089eabe239eaa24306cbe2a62602f3ecdf
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:f8ab3b4e07057099d0e9661e1108f2c94b4126ad0ab0c44ca9af6bb3bd2b9917
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1fabd0190b381df37676269268d272e959c191aa77066c59eec355ac0d052d21
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:93d9cfb36627643297556d68c2fd167c699a88be208868dcbda74b3ac3776f89
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ce7d88d0986f2975640fe8d0812c75f9e9b7879cde5110f70aad32b8c02d3be
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:93cbba61e44f8fd9c87c04ea2cdc110c1935c7ab4cc89cedce4b353e290f89c1
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aff709ea200ea8eb08d4178c7dddb1a3a3a68d69709bda0ce59028a7312d1c52
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:265760fe9788697ec3bf61fb178eb21105e6530a3fc23196bb8dddc8fa2ea6db
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:26a93b2a1f4b5368650119fe6e0d6eec6d19cda6badeba4d21943ab48964fa00
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.02102803738317757,
   "eval_steps": 3,
-  "global_step": 9,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -102,6 +102,13 @@
       "eval_samples_per_second": 118.252,
       "eval_steps_per_second": 14.925,
       "step": 9
     }
   ],
   "logging_steps": 1,
@@ -116,12 +123,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 7411455158648832.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.02336448598130841,
   "eval_steps": 3,
+  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 118.252,
       "eval_steps_per_second": 14.925,
       "step": 9
+    },
+    {
+      "epoch": 0.02336448598130841,
+      "grad_norm": 0.48678022623062134,
+      "learning_rate": 0.00016,
+      "loss": 1.6706,
+      "step": 10
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 8234950176276480.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null