Training in progress, step 160000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:180bd8afcb8ea5ad3ae5a04d5f826ec4d98e9451644a379bcab2f975d3632c6f
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8968668f8e27a4b1f96233ae49ecc50f9c5e2545b54cfd93a555e927df80094
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0454b1e243d2b5dca220df0685fba6335eb1b63797f2431af905499564f43e15
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:b89bdd1c6f08275cb2e1aa04e72a056b06bf108dbc0c3d5afa37eabd03b17492
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70b73a32ed5abbbe50bd03d52cbc0d9f97f3bad9c8c83394d1113e5e9a9c7c63
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3b3067508029879e87896713b3349dd43bd7950f30ba5b07186a08274e98f7c
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f22de639dadaf8f5ca48485412759765d7b50886c5fd569dc2a771bad6b9966
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:9474c05d6e8a6f5b3019c66a256463bb7adb6a64e5874719f1764013b2276887
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b862981d7b744793ba14de4eb91fa95c39e539315482c513f3de839b7f196be9
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:acc0bbfd6cb18044a737e07a313f5f858ebe57567f2d9d9913eda502ae80129e
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a842a7ac403f25c499f6e5769786574ac0afe54e735c6b7d2cf5e5b07eb1651b
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f8038127f9fec31bcc4140df87dba7f06dcbd7f6877e348434496dc82dc7b3e
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ae031280daf8907f446f3bdbb161df8e5e839f1f031c6cce17991477b9b4dddf
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c96c7d78c8952f41e39235dd3c789bd91208bed751957c893a54fb569c1a59d
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:068e1b75a2254acb81dd3afc8ec00c3c6ffb9c49ea1f1957f47f3efdd8db87e2
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:942a796eb949e7a972ad24a9f551ee4a24f1d706d7871dd44739891b623c5763
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.63829244006434,
-  "global_step": 155000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1866,6 +1866,66 @@
       "learning_rate": 0.00011936802347035692,
       "loss": 0.3417,
       "step": 155000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.723398098739585,
+  "global_step": 160000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00011936802347035692,
       "loss": 0.3417,
       "step": 155000
+    },
+    {
+      "epoch": 2.65,
+      "learning_rate": 0.00011918599236764778,
+      "loss": 0.3415,
+      "step": 155500
+    },
+    {
+      "epoch": 2.66,
+      "learning_rate": 0.00011900357451501401,
+      "loss": 0.3417,
+      "step": 156000
+    },
+    {
+      "epoch": 2.66,
+      "learning_rate": 0.00011882077171284612,
+      "loss": 0.3421,
+      "step": 156500
+    },
+    {
+      "epoch": 2.67,
+      "learning_rate": 0.00011863795251840704,
+      "loss": 0.3414,
+      "step": 157000
+    },
+    {
+      "epoch": 2.68,
+      "learning_rate": 0.00011845512101771738,
+      "loss": 0.3419,
+      "step": 157500
+    },
+    {
+      "epoch": 2.69,
+      "learning_rate": 0.00011827117647893832,
+      "loss": 0.3414,
+      "step": 158000
+    },
+    {
+      "epoch": 2.7,
+      "learning_rate": 0.0001180868542190981,
+      "loss": 0.3423,
+      "step": 158500
+    },
+    {
+      "epoch": 2.71,
+      "learning_rate": 0.00011790215605738305,
+      "loss": 0.3417,
+      "step": 159000
+    },
+    {
+      "epoch": 2.71,
+      "learning_rate": 0.00011771708381668941,
+      "loss": 0.3412,
+      "step": 159500
+    },
+    {
+      "epoch": 2.72,
+      "learning_rate": 0.00011753163932360551,
+      "loss": 0.3408,
+      "step": 160000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0454b1e243d2b5dca220df0685fba6335eb1b63797f2431af905499564f43e15
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:b89bdd1c6f08275cb2e1aa04e72a056b06bf108dbc0c3d5afa37eabd03b17492
 size 201355195