Training in progress, step 200000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8c7a1217516f1c133d24bb3d4b01300aff582a81619d3d1116de482975832802
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:db0082585963d0779a3f6f845b8a80f0898e8eedf6b822ae1abfa3c565e33123
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f20459a36d3d3a9cac8bb27dfd1c8133b9a775102f7d6624b00ef85ce8d11be2
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:54fb806d94f7814d043292764ccbf83208093216238755776971fd13549a8417
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f51296829618cd3aac8b758ff1127e9862fd5e8cd0fd7abc8577a9160e237c7
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:02ff42f6c9444191a36be04b13f7af185230adc9bf275d0694e2347ba302132d
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84dfd6945eb41b1cb519fcc4c855e9281eff7b5093625da74b060011b1ad4afd
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:effaa00a349e084c8da5b94ad9b11caf6487ba546f1186937a88a0177e674c2a
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d1e6eb189ca420ecc378796eb05160bf008f874b12982cf52f2ce307ad2df17d
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8cbaa6dd387c55ef769edc414fe52b33f735df38dad67cd88e3197b2fccab40
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:adc5617711a0cbdd1d1b3afd0601fc8e48a4056ca4765e9ca0a7b78f79204ba7
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:0660ca2210537ad62887c89aee0a6b18f7d33e103b3c25af90e948e70a018db8
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0a8b406f5f7aba898aebadaf3677cc3576d4f65c3fcd2a972307877861c6b081
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:c04d92b6e9668a995aa67c0fd2cccd57c4af61acd1f14d12f1653f5c4a66c8e5
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4ecbc1c4a1b52f43722a40d7cfcf0cbe0e1616aac22cceabe9c1c72c5a195ea
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:f1aa56a28bbfa690d13bc1188d2e157d2070090a00f8611ce9f5fd886a2b26ea
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.3191462200321697,
-  "global_step": 195000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2346,6 +2346,66 @@
       "learning_rate": 0.00010374392960436561,
       "loss": 0.3369,
       "step": 195000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.404251878707415,
+  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00010374392960436561,
       "loss": 0.3369,
       "step": 195000
+    },
+    {
+      "epoch": 3.33,
+      "learning_rate": 0.00010353693881803657,
+      "loss": 0.3364,
+      "step": 195500
+    },
+    {
+      "epoch": 3.34,
+      "learning_rate": 0.00010332971573162363,
+      "loss": 0.3363,
+      "step": 196000
+    },
+    {
+      "epoch": 3.34,
+      "learning_rate": 0.00010312226239033498,
+      "loss": 0.336,
+      "step": 196500
+    },
+    {
+      "epoch": 3.35,
+      "learning_rate": 0.0001029145808416514,
+      "loss": 0.336,
+      "step": 197000
+    },
+    {
+      "epoch": 3.36,
+      "learning_rate": 0.00010270667313530591,
+      "loss": 0.3357,
+      "step": 197500
+    },
+    {
+      "epoch": 3.37,
+      "learning_rate": 0.0001024985413232636,
+      "loss": 0.3357,
+      "step": 198000
+    },
+    {
+      "epoch": 3.38,
+      "learning_rate": 0.0001022901874597015,
+      "loss": 0.3354,
+      "step": 198500
+    },
+    {
+      "epoch": 3.39,
+      "learning_rate": 0.00010208161360098805,
+      "loss": 0.3355,
+      "step": 199000
+    },
+    {
+      "epoch": 3.4,
+      "learning_rate": 0.00010187282180566307,
+      "loss": 0.3354,
+      "step": 199500
+    },
+    {
+      "epoch": 3.4,
+      "learning_rate": 0.00010166506882009926,
+      "loss": 0.3356,
+      "step": 200000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f20459a36d3d3a9cac8bb27dfd1c8133b9a775102f7d6624b00ef85ce8d11be2
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:54fb806d94f7814d043292764ccbf83208093216238755776971fd13549a8417
 size 201355195