Training in progress, step 145000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:88502487669ed48c5b81d5668e89156ca00d459ffec5303442cc864943528e45
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:3dfe64e849ed38be0c116bf69502ab6ef673c3bfbb07d2a79ac601fd7abada84
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df9892519dbd6116b68b1382f6bef13a8948e72a1f7cdfd140a44813466337bd
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:655b828bf25e09d93b3a829341a96b780ef65754b049aae3719f02e2c2832c66
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:518d0c98c26e535dd659b44ad27605870644d0174fe82b5b955b8c75913da3f5
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:eaa575de425b3b6c389e6e8114c168b50828ecdc45cd1c9d7720b1b0c56d3927
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1dbd3b927f188de94763ae6dc5d2ab91c1f2f3e8c7e56ca840acc9f783d0c6d4
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:0e2381d7111aef0a952be74ccc43cf3d5aa266953bd08dd244c0a6b9d757e25d
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75dda0801167aeaa5255929f5576e748485109db796bcd6a0701c192fcac2bdc
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:da9027a0e55164e62a390848b61914abfd2e8c206179d8f0b6727d85ed77643f
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b3fe0f7ed2afce033c8d24222ffcba0f571c8b93d6124174a974b413ce6e4cd
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:d8e2fe6e6bdabd7edc33ae3f760b1ec4396638c232770774464ee59bd6e64ff7
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43c0a8099e9a7e853a472bfc2b42aadd31fdf32da1dafad4f35b19f8984441e1
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:5da286168e5064f0d0a7ce456ddb33da625498b14979026402cfccd39d5838b1
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a764d29a3460312afa48d75bfde217931b9b606545018d900461c5290efd3e7
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:79d75c9447e835638ffa3474c117803239ed9981e80652713d41db8acbe224ff
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.382978723404255,
-  "global_step": 140000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1686,6 +1686,66 @@
       "learning_rate": 0.00012463797674266635,
       "loss": 0.3409,
       "step": 140000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.4680851063829787,
+  "global_step": 145000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00012463797674266635,
       "loss": 0.3409,
       "step": 140000
+    },
+    {
+      "epoch": 2.39,
+      "learning_rate": 0.00012446835960053801,
+      "loss": 0.3407,
+      "step": 140500
+    },
+    {
+      "epoch": 2.4,
+      "learning_rate": 0.000124298303573653,
+      "loss": 0.3406,
+      "step": 141000
+    },
+    {
+      "epoch": 2.41,
+      "learning_rate": 0.0001241278103403957,
+      "loss": 0.3405,
+      "step": 141500
+    },
+    {
+      "epoch": 2.42,
+      "learning_rate": 0.00012395722387451133,
+      "loss": 0.3406,
+      "step": 142000
+    },
+    {
+      "epoch": 2.43,
+      "learning_rate": 0.00012378586214689284,
+      "loss": 0.3403,
+      "step": 142500
+    },
+    {
+      "epoch": 2.43,
+      "learning_rate": 0.000123614068270492,
+      "loss": 0.3402,
+      "step": 143000
+    },
+    {
+      "epoch": 2.44,
+      "learning_rate": 0.00012344184394084504,
+      "loss": 0.3398,
+      "step": 143500
+    },
+    {
+      "epoch": 2.45,
+      "learning_rate": 0.00012326919085773659,
+      "loss": 0.34,
+      "step": 144000
+    },
+    {
+      "epoch": 2.46,
+      "learning_rate": 0.00012309611072518285,
+      "loss": 0.3397,
+      "step": 144500
+    },
+    {
+      "epoch": 2.47,
+      "learning_rate": 0.00012292260525141485,
+      "loss": 0.34,
+      "step": 145000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df9892519dbd6116b68b1382f6bef13a8948e72a1f7cdfd140a44813466337bd
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:655b828bf25e09d93b3a829341a96b780ef65754b049aae3719f02e2c2832c66
 size 201355195