Training in progress, step 20, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d93e1447df338cb82425c676ee327e29e6ccdf6b0fcb1e6b1e8bcc1b9790a47
 size 1716360444

 version https://git-lfs.github.com/spec/v1
+oid sha256:0a764fbda5943541947f63553e5167c97297a5db349245805e90871ee44ca6af
 size 1716360444

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f9a2844302fb6bb266b84b60df234bff01243f6e34895e273c410eeacbbc97e6
 size 3433062021

 version https://git-lfs.github.com/spec/v1
+oid sha256:806f6f5ab92428f5386186fc63b5907b8b5323c7e6a997d5fc6d431531ef0395
 size 3433062021

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7775cfb857ea8d5dad4e55d621fe6b664e7f7e01b9a13925f47757ea28a71912
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:1518ee95bdd1b49cc70d991bd9aa4565aa12c1bc44f83d5111632402e1671564
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b32c228988998aa7f8c86d4c26da16835ba6d8d022fa594dfdc2c5ed5b7a666
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:c02e795be2005cfb6114b898274cb7b49c620eb2cb7c5e988b220f7aa723b1fc
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.04608294930875576,
   "eval_steps": 100,
-  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -14,10 +14,17 @@
       "learning_rate": 4.999735579817769e-05,
       "loss": 1.4008,
       "step": 10
     }
   ],
   "logging_steps": 10,
-  "max_steps": 1085,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 10,
@@ -33,7 +40,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 23929694515200.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.09237875288683603,
   "eval_steps": 100,
+  "global_step": 20,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 4.999735579817769e-05,
       "loss": 1.4008,
       "step": 10
+    },
+    {
+      "epoch": 0.09237875288683603,
+      "grad_norm": 2.0704426765441895,
+      "learning_rate": 4.997598371650346e-05,
+      "loss": 1.388,
+      "step": 20
     }
   ],
   "logging_steps": 10,
+  "max_steps": 1080,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 10,
       "attributes": {}
     }
   },
+  "total_flos": 47859389030400.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43d91b1496178ac406352964cea26801514f7d8531618943d63c80852c83fa37
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:fed09fd527038c16340e2f427d8a40a587733060f6ee64d37fc8b4c4cdfce0b6
 size 5112