Training in progress, step 5000

Files changed (13) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:20ab356fa18f110500a5c92dc47dd1e4511f4ece5e195bf6f39801135def9e7a
 size 943333453

 version https://git-lfs.github.com/spec/v1
+oid sha256:2815fe401ec6ed13fa8496b8a130981165e9740f25a9aa0f5046eb298d76e89d
 size 943333453

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e1aace261b8e6cad923ee6661d1c7271017bc8d22f018c02ff43351ce6bc4e31
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:43d467d75f3fdef469e5bc56ca1fac1d83e9042d52441105a2d20418fb1a0436
 size 471708325

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7bc19aba973831004a77f20c88b8e3e066a8a55403bc0ad8b246efb14f309ecd
-size 14567

 version https://git-lfs.github.com/spec/v1
+oid sha256:2124064e0e4e5ab159e152ae1f2b839ea342c8916f3940e7326b5af6d56d60f7
+size 14503

last-checkpoint/scaler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b3fad2f6fce6a53bcc536267fb713fc98b77d91952cd1de74b585c2aab05034
+size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:586f9b073107d2287ab918b8e3a6c9ec40a7767baa6b65a691f978a7a7ba2ab5
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:856d2b6c50571997ea86916bdeeedeb8e6b238155372c64b4e024237aa1cc790
 size 623

last-checkpoint/tokenizer.json CHANGED Viewed

@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 4096,
     "strategy": "OnlySecond",
     "stride": 128
   },
   "padding": {
     "strategy": {
-      "Fixed": 4096
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 2048,
     "strategy": "OnlySecond",
     "stride": 128
   },
   "padding": {
     "strategy": {
+      "Fixed": 2048
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,32 +1,32 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.008156606851549755,
-  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.01,
-      "learning_rate": 2.9918433931484505e-05,
-      "loss": 3.6749,
-      "step": 500
     },
     {
-      "epoch": 0.01,
-      "eval_exact_match": 25.56077203964528,
-      "eval_f1": 30.48757258245567,
-      "eval_loss": 2.4391441345214844,
-      "eval_runtime": 1683.1549,
-      "eval_samples_per_second": 6.834,
-      "eval_steps_per_second": 6.834,
-      "step": 500
     }
   ],
-  "max_steps": 183900,
   "num_train_epochs": 3,
-  "total_flos": 1103235145728000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.16288767266093301,
+  "global_step": 5000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.16,
+      "learning_rate": 2.8373729476153247e-05,
+      "loss": 1.6126,
+      "step": 5000
     },
     {
+      "epoch": 0.16,
+      "eval_exact_match": 68.15336463223787,
+      "eval_f1": 73.98256617857639,
+      "eval_loss": 1.189887523651123,
+      "eval_runtime": 1542.7266,
+      "eval_samples_per_second": 7.463,
+      "eval_steps_per_second": 3.732,
+      "step": 5000
     }
   ],
+  "max_steps": 92088,
   "num_train_epochs": 3,
+  "total_flos": 1.103235145728e+16,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce3df7dacb746d38927d7b4b5c96e23b1180109e65ab3c5eda16560beab01da4
 size 3439

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1a307dd73542378086e35083774070bcc9254069583647323f4d6017ba44c0d
 size 3439

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e1aace261b8e6cad923ee6661d1c7271017bc8d22f018c02ff43351ce6bc4e31
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:43d467d75f3fdef469e5bc56ca1fac1d83e9042d52441105a2d20418fb1a0436
 size 471708325

tokenizer.json CHANGED Viewed

@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 4096,
     "strategy": "OnlySecond",
     "stride": 128
   },
   "padding": {
     "strategy": {
-      "Fixed": 4096
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 2048,
     "strategy": "OnlySecond",
     "stride": 128
   },
   "padding": {
     "strategy": {
+      "Fixed": 2048
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce3df7dacb746d38927d7b4b5c96e23b1180109e65ab3c5eda16560beab01da4
 size 3439

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1a307dd73542378086e35083774070bcc9254069583647323f4d6017ba44c0d
 size 3439