Training in progress, step 338, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9fa01b3abb7656551224fc4fbeb611a0886c86685343fa6406fe831c1db71f04
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:2b8a3eece0dc302434ef64183cab96e50003409d00c5c3306d0ef88aceb611bd
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:88fab551c9bf6c469ad35ab513b4416c08bfdf970747a1f23bd5b53582b807c8
 size 37431220

 version https://git-lfs.github.com/spec/v1
+oid sha256:92caf4c36df1978405832c53a74c976a3189649219062536fb762290a417f73e
 size 37431220

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b12f765a366db773a3e801ac0d1a41ae53b843966dba1e15b6484a9f4d83233f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:5421d489113a06f78cffb8ba158f8a76b5b37f551fb566a3800bdcadd25c598b
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9245541838134431,
   "eval_steps": 500,
-  "global_step": 337,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2366,6 +2366,13 @@
       "learning_rate": 2.0454545454545457e-05,
       "loss": 1.1601,
       "step": 337
     }
   ],
   "logging_steps": 1,
@@ -2385,7 +2392,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 4.1769332820525466e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.9272976680384087,
   "eval_steps": 500,
+  "global_step": 338,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.0454545454545457e-05,
       "loss": 1.1601,
       "step": 337
+    },
+    {
+      "epoch": 0.9272976680384087,
+      "grad_norm": 0.16423514485359192,
+      "learning_rate": 1.9696969696969697e-05,
+      "loss": 1.1818,
+      "step": 338
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 4.18827695165313e+17,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null