Training in progress, step 10000

Files changed (9) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2815fe401ec6ed13fa8496b8a130981165e9740f25a9aa0f5046eb298d76e89d
 size 943333453

 version https://git-lfs.github.com/spec/v1
+oid sha256:33ad74f665a3348bf6d5e3ed299f7d4a7b088b85d5bec7ac115386ab6edda94f
 size 943333453

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43d467d75f3fdef469e5bc56ca1fac1d83e9042d52441105a2d20418fb1a0436
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ca5b7f87f157eff6693ee1f1169b77aa22b7f8a1f4a26872e93b75338ac3e77
 size 471708325

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2124064e0e4e5ab159e152ae1f2b839ea342c8916f3940e7326b5af6d56d60f7
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d45aeed5414b04020f4a5838ded6cc7c6a982ebbcb1218c96b18a1d5d9638300
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b3fad2f6fce6a53bcc536267fb713fc98b77d91952cd1de74b585c2aab05034
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:68acf919319a139013fd82fcbfd6c4d169e0a48d6ea3e7014b7221b66195f3c9
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:856d2b6c50571997ea86916bdeeedeb8e6b238155372c64b4e024237aa1cc790
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:b53d49cf7f37049401f5c9ba25adfe57342376a940b10cb055a010720a691d14
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.16288767266093301,
-  "global_step": 5000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -22,11 +22,27 @@
       "eval_samples_per_second": 7.463,
       "eval_steps_per_second": 3.732,
       "step": 5000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
-  "total_flos": 1.103235145728e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.32577534532186603,
+  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 7.463,
       "eval_steps_per_second": 3.732,
       "step": 5000
+    },
+    {
+      "epoch": 0.33,
+      "learning_rate": 2.674550430023456e-05,
+      "loss": 1.1965,
+      "step": 10000
+    },
+    {
+      "epoch": 0.33,
+      "eval_exact_match": 75.13475917231786,
+      "eval_f1": 79.95184555682803,
+      "eval_loss": 0.9056070446968079,
+      "eval_runtime": 1533.9546,
+      "eval_samples_per_second": 7.505,
+      "eval_steps_per_second": 3.753,
+      "step": 10000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
+  "total_flos": 2.206470291456e+16,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43d467d75f3fdef469e5bc56ca1fac1d83e9042d52441105a2d20418fb1a0436
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ca5b7f87f157eff6693ee1f1169b77aa22b7f8a1f4a26872e93b75338ac3e77
 size 471708325