Training in progress, step 3500

Files changed (8) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:800ce167b888c1555ce149731d7bc2c753c37b67d31170fb09caffc5792b1e4e
 size 880446181

 version https://git-lfs.github.com/spec/v1
+oid sha256:633117411df249b67810ce444bf3fb43946a8cd66899354347e95f320178ff8d
 size 880446181

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc8e99aaece0e5506cc318f72aba485312ecdd92d231f7a6abf4c66a19db2012
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
 size 440235825

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cfa290a26b1da9a46696e39d6f59c27396a70c365e5a24ca8436eb906badd239
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8af43f49c567fc21216a636a0b928ad3f2b478713872cde9fab7fd2e5b3bd94
 size 14503

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:98dfa5e5e97bb43603b1e5dcc06c796459aa988da669f9bb10ae35ce686b5186
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:52671e748af9f02c099fe74fa17abb19dd5557da6aa5f91f903c19df101db345
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.3124349093938763,
-  "global_step": 3000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -102,11 +102,27 @@
       "eval_samples_per_second": 92.093,
       "eval_steps_per_second": 11.514,
       "step": 3000
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
-  "total_flos": 6271122161664000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.36450739429285567,
+  "global_step": 3500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 92.093,
       "eval_steps_per_second": 11.514,
       "step": 3000
+    },
+    {
+      "epoch": 0.36,
+      "learning_rate": 2.6354926057071445e-05,
+      "loss": 0.8375,
+      "step": 3500
+    },
+    {
+      "epoch": 0.36,
+      "eval_exact_match": 63.82368283776734,
+      "eval_f1": 68.19581427410363,
+      "eval_loss": 0.7115561366081238,
+      "eval_runtime": 154.7006,
+      "eval_samples_per_second": 91.822,
+      "eval_steps_per_second": 11.48,
+      "step": 3500
     }
   ],
   "max_steps": 28806,
   "num_train_epochs": 3,
+  "total_flos": 7316309188608000.0,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc8e99aaece0e5506cc318f72aba485312ecdd92d231f7a6abf4c66a19db2012
 size 440235825

 version https://git-lfs.github.com/spec/v1
+oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
 size 440235825