Training in progress, step 395000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fee40aa1a6fbacfee552fffa429a1bb6a6bbe0587a8c00ceeeb72d56fcc5491b
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:8badaf858040e9a408943a6e9fbd7b673381f667c74f44da38b93b7faa806cd6
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b03a99e1730ed0b4ad5c89ac4a80049122fe9a7b433c61647b26278b007fbb43
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:a7e0679255ea6b36201b0d808a362cef9e0cc4250bf2a27a7d227fb77c38b5a3
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba2482f8cf2440cec0254d5988cce37640442e59f079fb17bd6bcd415e99bcb1
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:321f848c05abd7bede59850502e9582f8a2efa51300e70f7c4e42416383b1f9d
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d70e0b0c79d2fa6d6a28c01c5bc090995fd291533a40cd841db17d67210ae78a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:7173cab8fec53de370fc776b8ec60abd28823c70815e5aae8f471b1d4cd8593a
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a3fc66b05c070cd63ffd00ff8eb77c5a4d2302ca4f6995b3280fe94d5663ac9
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:9bbf3b61889bf57772bca69e3fa2b3a58e51beabaa460befd9b8ff1bc01f45da
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bacc9e2fc4f21f22254517223c74cdcb7c52a6a0ffca9793eaf062a0287de1d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:053726ed745fa923b4c9b6b87c5501b19122cc00993e8b017178f10a7f218f5b
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:684e728a687523626e6715432733611e4b4256378736ca4bcaa27753a07851d5
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:062ee8ab98f80273aee87dab235a0bc7258dc420c22cabc1af7c5b580c42129d
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e66e0b2e2c0276f2bbbbb229f2d3a165b984c5fe5faf07983c7e165b1a34186
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:09de475ccd38f92b9bb28c41a7de8a4a2d4763ec7818473a0c7e4d4586d6efeb
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.6382924400643395,
-  "global_step": 390000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4686,6 +4686,66 @@
       "learning_rate": 2.6106711361365064e-05,
       "loss": 0.3206,
       "step": 390000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.723398098739585,
+  "global_step": 395000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.6106711361365064e-05,
       "loss": 0.3206,
       "step": 390000
+    },
+    {
+      "epoch": 6.65,
+      "learning_rate": 2.5966638924843332e-05,
+      "loss": 0.3204,
+      "step": 390500
+    },
+    {
+      "epoch": 6.66,
+      "learning_rate": 2.5827099775781274e-05,
+      "loss": 0.3204,
+      "step": 391000
+    },
+    {
+      "epoch": 6.66,
+      "learning_rate": 2.5688095291373918e-05,
+      "loss": 0.3203,
+      "step": 391500
+    },
+    {
+      "epoch": 6.67,
+      "learning_rate": 2.554962684353946e-05,
+      "loss": 0.3203,
+      "step": 392000
+    },
+    {
+      "epoch": 6.68,
+      "learning_rate": 2.5411695798905557e-05,
+      "loss": 0.3205,
+      "step": 392500
+    },
+    {
+      "epoch": 6.69,
+      "learning_rate": 2.5274303518795908e-05,
+      "loss": 0.3206,
+      "step": 393000
+    },
+    {
+      "epoch": 6.7,
+      "learning_rate": 2.513745135921688e-05,
+      "loss": 0.3203,
+      "step": 393500
+    },
+    {
+      "epoch": 6.71,
+      "learning_rate": 2.5001412750937412e-05,
+      "loss": 0.3205,
+      "step": 394000
+    },
+    {
+      "epoch": 6.71,
+      "learning_rate": 2.4865643792130036e-05,
+      "loss": 0.3204,
+      "step": 394500
+    },
+    {
+      "epoch": 6.72,
+      "learning_rate": 2.473041898715981e-05,
+      "loss": 0.3201,
+      "step": 395000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b03a99e1730ed0b4ad5c89ac4a80049122fe9a7b433c61647b26278b007fbb43
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:a7e0679255ea6b36201b0d808a362cef9e0cc4250bf2a27a7d227fb77c38b5a3
 size 201355195