Training in progress, step 35000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9dfb8ee546a393cbd088a1267e0528b64ac1f6edc55a139ae628e0fae50bc81f
 size 402587859

 version https://git-lfs.github.com/spec/v1
+oid sha256:a6a5a7674dbb8d58ec4d7b340f1e19ce8cd6e355cf21b578954983287a8734b6
 size 402587859

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:552e7d2fc0351ff5002d604566f010c93ce9e53db2a7a86ba323848706c62524
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:2677cfed78ccae5496a895d92941064711c7091014942cb86f552eaa9b73b86b
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5cf95a496e0d0c153b9cfd4e8a1f7162ed59c2414c99c7838d29cd8f942ca48
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:a2084cf08b52c1263f45bb8b8d4f65131103615cabf4896bf98de710a4ca1760
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f9035eb22871e934ea2071d3c37031d3b68bc4ca9c57bb37af510e052600d5a2
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:668b3257e9fcad50addd96ee800eedbd732b610a370bd832008ee3ea4b26fb8e
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f37c6f1bf46d4683c647937edd88a5957adcf809e2ade87bcd816e5a9ad05c40
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:e83414b6fee779cf5d18e0d6de9bcb0d6baea757a03c57176cc09bb4cd38cf3d
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70c5619b7d22e67fa4d8ad8e5aac6be8872972633f6b700f4285106349937d54
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0a9889c36f8cea70cf9f3a51e8e629fdb3421f3d44d2e389fe9d24a271ed606
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f7facac06cf47f02915a64f3844ee1569b5a7479cd81db3f11a1da1896148a4d
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:946d977aec6ac3e6d969a438e59b6cba069f78c02c4d887419131bdbe7403a10
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5b2ecce13783d3eb66c2381b219fe80ea60a6817507cb21aea863465c4774335
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0991d8986307506ff20d1a384de1955fdf6c7f066139da3ee7c2fdbb8b4f5ce
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.5106339520514719,
-  "global_step": 30000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -366,6 +366,66 @@
       "learning_rate": 0.00014876101394745023,
       "loss": 0.3747,
       "step": 30000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.5957396107267172,
+  "global_step": 35000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00014876101394745023,
       "loss": 0.3747,
       "step": 30000
+    },
+    {
+      "epoch": 0.52,
+      "learning_rate": 0.00014871948232026222,
+      "loss": 0.3741,
+      "step": 30500
+    },
+    {
+      "epoch": 0.53,
+      "learning_rate": 0.00014867727245952692,
+      "loss": 0.3739,
+      "step": 31000
+    },
+    {
+      "epoch": 0.54,
+      "learning_rate": 0.00014863447123337502,
+      "loss": 0.3736,
+      "step": 31500
+    },
+    {
+      "epoch": 0.54,
+      "learning_rate": 0.00014859090751637814,
+      "loss": 0.3733,
+      "step": 32000
+    },
+    {
+      "epoch": 0.55,
+      "learning_rate": 0.00014854666683481534,
+      "loss": 0.3728,
+      "step": 32500
+    },
+    {
+      "epoch": 0.56,
+      "learning_rate": 0.0001485017496253243,
+      "loss": 0.3725,
+      "step": 33000
+    },
+    {
+      "epoch": 0.57,
+      "learning_rate": 0.00014845624819224238,
+      "loss": 0.3722,
+      "step": 33500
+    },
+    {
+      "epoch": 0.58,
+      "learning_rate": 0.00014840998061432743,
+      "loss": 0.3719,
+      "step": 34000
+    },
+    {
+      "epoch": 0.59,
+      "learning_rate": 0.00014836313241655734,
+      "loss": 0.3717,
+      "step": 34500
+    },
+    {
+      "epoch": 0.6,
+      "learning_rate": 0.00014831551629313194,
+      "loss": 0.3711,
+      "step": 35000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:552e7d2fc0351ff5002d604566f010c93ce9e53db2a7a86ba323848706c62524
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:2677cfed78ccae5496a895d92941064711c7091014942cb86f552eaa9b73b86b
 size 201355195