Training in progress, step 390000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:18de3f7cc4a91ac6868744a9cd20f39edaebacb5665b74cf4f2175021a0edb90
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:fee40aa1a6fbacfee552fffa429a1bb6a6bbe0587a8c00ceeeb72d56fcc5491b
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7132bd452806a1828ae1699a118b9aa68caeae454b47d624252df8772b23b65
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:b03a99e1730ed0b4ad5c89ac4a80049122fe9a7b433c61647b26278b007fbb43
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53e62c4c1922f2a1587e8d53c73b96e423282fb6d6259d9ca0f71ac25e5e8153
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:ba2482f8cf2440cec0254d5988cce37640442e59f079fb17bd6bcd415e99bcb1
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:10f7532403f5b493736d56d3ea7cc99fbf67e90d193efeb30456688505225f32
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d70e0b0c79d2fa6d6a28c01c5bc090995fd291533a40cd841db17d67210ae78a
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4e2f6272d55d9d66dae051add9b1254b4bef8eb2c18fe3b5027696d129a3821
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:9a3fc66b05c070cd63ffd00ff8eb77c5a4d2302ca4f6995b3280fe94d5663ac9
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28a933ecd96bcb0ef9d59cde72c7a2f327911f311001e588d3f029f5f85e1a29
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bacc9e2fc4f21f22254517223c74cdcb7c52a6a0ffca9793eaf062a0287de1d
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0634118a00ed086ccf276fc79772adc912101484932dd3c63dd24fd9eb2718ce
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:684e728a687523626e6715432733611e4b4256378736ca4bcaa27753a07851d5
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:468447bff0f0da8cbb0e93720be4efb28f0be877ee6d17ac6e3f1416931c3f00
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e66e0b2e2c0276f2bbbbb229f2d3a165b984c5fe5faf07983c7e165b1a34186
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.553186781389095,
-  "global_step": 385000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4626,6 +4626,66 @@
       "learning_rate": 2.753587746225503e-05,
       "loss": 0.3208,
       "step": 385000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.6382924400643395,
+  "global_step": 390000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.753587746225503e-05,
       "loss": 0.3208,
       "step": 385000
+    },
+    {
+      "epoch": 6.56,
+      "learning_rate": 2.7390551122062965e-05,
+      "loss": 0.3208,
+      "step": 385500
+    },
+    {
+      "epoch": 6.57,
+      "learning_rate": 2.7245744015892008e-05,
+      "loss": 0.3206,
+      "step": 386000
+    },
+    {
+      "epoch": 6.58,
+      "learning_rate": 2.7101457572929877e-05,
+      "loss": 0.3206,
+      "step": 386500
+    },
+    {
+      "epoch": 6.59,
+      "learning_rate": 2.6957693217225504e-05,
+      "loss": 0.3207,
+      "step": 387000
+    },
+    {
+      "epoch": 6.6,
+      "learning_rate": 2.6814452367675008e-05,
+      "loss": 0.3205,
+      "step": 387500
+    },
+    {
+      "epoch": 6.6,
+      "learning_rate": 2.6671736438007784e-05,
+      "loss": 0.3206,
+      "step": 388000
+    },
+    {
+      "epoch": 6.61,
+      "learning_rate": 2.6529830689765492e-05,
+      "loss": 0.3206,
+      "step": 388500
+    },
+    {
+      "epoch": 6.62,
+      "learning_rate": 2.6388167763455287e-05,
+      "loss": 0.3204,
+      "step": 389000
+    },
+    {
+      "epoch": 6.63,
+      "learning_rate": 2.62470339642853e-05,
+      "loss": 0.3204,
+      "step": 389500
+    },
+    {
+      "epoch": 6.64,
+      "learning_rate": 2.6106711361365064e-05,
+      "loss": 0.3206,
+      "step": 390000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7132bd452806a1828ae1699a118b9aa68caeae454b47d624252df8772b23b65
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:b03a99e1730ed0b4ad5c89ac4a80049122fe9a7b433c61647b26278b007fbb43
 size 201355195