End of training

Files changed (5) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,11 @@
 {
     "epoch": 2.0,
-    "train_loss": 0.21116681609834945,
-    "train_runtime": 5.9654,
     "train_samples": 100,
-    "train_samples_per_second": 33.527,
-    "train_steps_per_second": 2.347
 }

 {
     "epoch": 2.0,
+    "eval_exact_match": 0.0,
+    "eval_f1": 13.633333333333333,
+    "eval_samples": 100,
+    "train_loss": 0.28480225572219264,
+    "train_runtime": 22.8013,
     "train_samples": 100,
+    "train_samples_per_second": 8.771,
+    "train_steps_per_second": 1.14
 }

eval_results.json ADDED Viewed

+{
+    "epoch": 2.0,
+    "eval_exact_match": 0.0,
+    "eval_f1": 13.633333333333333,
+    "eval_samples": 100
+}

runs/Oct06_18-45-10_g3032/events.out.tfevents.1665107227.g3032.570.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:38e4976d489defd121c3c2fb9296ff25e3b94943d507399266eaf7a5de352613
+size 188

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 2.0,
-    "train_loss": 0.21116681609834945,
-    "train_runtime": 5.9654,
     "train_samples": 100,
-    "train_samples_per_second": 33.527,
-    "train_steps_per_second": 2.347
 }

 {
     "epoch": 2.0,
+    "train_loss": 0.28480225572219264,
+    "train_runtime": 22.8013,
     "train_samples": 100,
+    "train_samples_per_second": 8.771,
+    "train_steps_per_second": 1.14
 }

trainer_state.json CHANGED Viewed

@@ -2,28 +2,40 @@
   "best_metric": null,
   "best_model_checkpoint": null,
   "epoch": 2.0,
-  "global_step": 14,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 1.43,
-      "learning_rate": 8.571428571428571e-06,
-      "loss": 0.2568,
       "step": 10
     },
     {
       "epoch": 2.0,
-      "step": 14,
       "total_flos": 60973645824000.0,
-      "train_loss": 0.21116681609834945,
-      "train_runtime": 5.9654,
-      "train_samples_per_second": 33.527,
-      "train_steps_per_second": 2.347
     }
   ],
-  "max_steps": 14,
   "num_train_epochs": 2,
   "total_flos": 60973645824000.0,
   "trial_name": null,

   "best_metric": null,
   "best_model_checkpoint": null,
   "epoch": 2.0,
+  "global_step": 26,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.77,
+      "learning_rate": 1.8461538461538465e-05,
+      "loss": 0.5091,
       "step": 10
     },
+    {
+      "epoch": 1.54,
+      "learning_rate": 6.923076923076923e-06,
+      "loss": 0.1673,
+      "step": 20
+    },
+    {
+      "epoch": 1.54,
+      "eval_exact_match": 0.0,
+      "eval_f1": 15.883333333333333,
+      "step": 20
+    },
     {
       "epoch": 2.0,
+      "step": 26,
       "total_flos": 60973645824000.0,
+      "train_loss": 0.28480225572219264,
+      "train_runtime": 22.8013,
+      "train_samples_per_second": 8.771,
+      "train_steps_per_second": 1.14
     }
   ],
+  "max_steps": 26,
   "num_train_epochs": 2,
   "total_flos": 60973645824000.0,
   "trial_name": null,