Training in progress, step 113, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:462e144bcab7491a70358c1f4a875b6c27d67b6cc92caed5a4e5742768be49ed
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:c529a85454a3d96a5940fa5d781d9577b35d06f3dc016844d7b8b300f297013a
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:83c6c05071edf86108c1c7cf96712e1797e3856536617579a4fd809cd5d683ff
 size 37430836

 version https://git-lfs.github.com/spec/v1
+oid sha256:ebe248069e09f4931f12d918e0d5b47cbf7e6f6c3a440eed76b31cd6eacbb695
 size 37430836

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:52d52fc2543a3ca6e1f42845f53001bf363359931a890c3cf7363ae9b686adbc
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:74a8f3454c415665d0358e152faea0ef684bc7b623fa35ef64763c0af976fed2
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.3045267489711934,
   "eval_steps": 500,
-  "global_step": 111,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -784,6 +784,20 @@
       "learning_rate": 0.00019166666666666667,
       "loss": 1.2829,
       "step": 111
     }
   ],
   "logging_steps": 1,
@@ -803,7 +817,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.3736075613985997e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.3100137174211248,
   "eval_steps": 500,
+  "global_step": 113,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00019166666666666667,
       "loss": 1.2829,
       "step": 111
+    },
+    {
+      "epoch": 0.30727023319615915,
+      "grad_norm": 0.12115694582462311,
+      "learning_rate": 0.00019090909090909092,
+      "loss": 1.3109,
+      "step": 112
+    },
+    {
+      "epoch": 0.3100137174211248,
+      "grad_norm": 0.12799453735351562,
+      "learning_rate": 0.00019015151515151517,
+      "loss": 1.2836,
+      "step": 113
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 1.4010395508772454e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null