Training in progress, step 15000

Files changed (9) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33ad74f665a3348bf6d5e3ed299f7d4a7b088b85d5bec7ac115386ab6edda94f
 size 943333453

 version https://git-lfs.github.com/spec/v1
+oid sha256:d7ce6f47f0b535e3c17cf93424dcb27acff863da3bee507ab09fd792b5441dce
 size 943333453

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ca5b7f87f157eff6693ee1f1169b77aa22b7f8a1f4a26872e93b75338ac3e77
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:936c68f355516686acc9fd8569ff44fad57e40ebab35445a8e00a909274717d0
 size 471708325

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d45aeed5414b04020f4a5838ded6cc7c6a982ebbcb1218c96b18a1d5d9638300
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d26e5aedc9783fd5b42389903a55518c26dc435542e82c46eab02c99a9e3e04
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68acf919319a139013fd82fcbfd6c4d169e0a48d6ea3e7014b7221b66195f3c9
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:320e7103d68ac581e0918aaf471171063cef4a15a2322663039e70f087daa791
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b53d49cf7f37049401f5c9ba25adfe57342376a940b10cb055a010720a691d14
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:6b00fc05a490426638de1c3614fb5c6f7749b64a69fbff99c5dbd21e1e76058a
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.32577534532186603,
-  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -38,11 +38,27 @@
       "eval_samples_per_second": 7.505,
       "eval_steps_per_second": 3.753,
       "step": 10000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
-  "total_flos": 2.206470291456e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.48866301798279904,
+  "global_step": 15000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 7.505,
       "eval_steps_per_second": 3.753,
       "step": 10000
+    },
+    {
+      "epoch": 0.49,
+      "learning_rate": 2.511695334897055e-05,
+      "loss": 1.0769,
+      "step": 15000
+    },
+    {
+      "epoch": 0.49,
+      "eval_exact_match": 77.56042427403929,
+      "eval_f1": 82.22503770504048,
+      "eval_loss": 0.9495312571525574,
+      "eval_runtime": 1533.818,
+      "eval_samples_per_second": 7.506,
+      "eval_steps_per_second": 3.753,
+      "step": 15000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
+  "total_flos": 3.309705437184e+16,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ca5b7f87f157eff6693ee1f1169b77aa22b7f8a1f4a26872e93b75338ac3e77
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:936c68f355516686acc9fd8569ff44fad57e40ebab35445a8e00a909274717d0
 size 471708325