Training in progress, step 251, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2691407e9db6ae21000dc87e08d0d8fb548f1923503f90b92ad086b54d974ae1
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:51d670e3d79bfffb5e042b5a3ce721b3dac237b5e9f862d93b021230929bd440
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c9e099b5fc649b11d8e4b894d2342b1318a4c832ef77fe234061bd70729796e8
 size 37430836

 version https://git-lfs.github.com/spec/v1
+oid sha256:92c4b9a1038c3864c6aebfb5f80fb47be5cb30b63f2ac18316cd50f58f7c5813
 size 37430836

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a105afde5a3c32763bae234182a757cc9ea379a36da56361598dedb244c2ffd5
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:7657b3ddb2232aa8012a32fb00c3fb92277ec0be13fceb0c90bdaa595cabccac
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.6858710562414266,
   "eval_steps": 500,
-  "global_step": 250,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1757,6 +1757,13 @@
       "learning_rate": 8.636363636363637e-05,
       "loss": 1.1622,
       "step": 250
     }
   ],
   "logging_steps": 1,
@@ -1776,7 +1783,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 3.0922878573950976e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.6886145404663924,
   "eval_steps": 500,
+  "global_step": 251,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 8.636363636363637e-05,
       "loss": 1.1622,
       "step": 250
+    },
+    {
+      "epoch": 0.6886145404663924,
+      "grad_norm": 0.16669955849647522,
+      "learning_rate": 8.560606060606061e-05,
+      "loss": 1.1737,
+      "step": 251
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 3.1050607333850726e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null