Training in progress, step 485000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ffd4c2a109a9e135f9e2cb7cc828c1911698c33d1ccf5fdca1593df34bb8086
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:d893568f1b98d344be31605b8fae96006b46a052189571c91e8e7ad3d7d78aa0
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d212205555a22147e8aebc90c2a3779922ada08fea6366382eebbae33ef7733
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ccac6cfd193e438464e5b6e186f7cfb7a9fd45fac4373893748d8948cac56c4
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:26b1826817e810c9dc45f2909a7e45f769a2500bdd1f428015f13cf25e473141
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:011ebe7c11d42cd0a1c9b353a4965be6c7e082f73fc7473a2a615e866449a3b0
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3fa0832929a00ea6055e699b75a7627daf7b17e107be598a3fe2d7a9281e0924
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:637dc4bb1fca17ae7fe8b636a8730cdbeb63210200e935b533f565d1c0df8760
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:187fd12f48b591a20353530c604c3cc719ffd86a7dce827c1fb47a37b3150193
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f17a75302e0f04f282b97e3b350868a9f3d9c32fda1e8e8967e950ebb8a6f6fa
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bb6a46b112d7ab2d19eb05a1f181a7fa13271e6e08017cda1263c31506394cdf
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:b61883c7448b2ee328c7d8245911d6c0b73c91036e9453c3237361bcca67410c
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6bca461a5fb77b29582a161948272cc1f36cfc27055cf6cde6a878ddd99b607c
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:9adb8b1f94ae4dfb98288f1d9b1d42fa2616a61139269170f13efbd2d3c52aac
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4c3fc190a91ef93911570e5ff0dc0da8ca87cb849c536f2494eefe91a266c5e
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:18d51d5350efcb705648a3973831fb0ad4e4c422f14bb0cb6af95016a44e9103
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 8.17021131735049,
-  "global_step": 480000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5766,6 +5766,66 @@
       "learning_rate": 1.0562215843511462e-05,
       "loss": 0.3186,
       "step": 480000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 8.255316976025735,
+  "global_step": 485000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.0562215843511462e-05,
       "loss": 0.3186,
       "step": 480000
+    },
+    {
+      "epoch": 8.18,
+      "learning_rate": 1.0534742744692915e-05,
+      "loss": 0.3186,
+      "step": 480500
+    },
+    {
+      "epoch": 8.19,
+      "learning_rate": 1.0507955239919215e-05,
+      "loss": 0.3185,
+      "step": 481000
+    },
+    {
+      "epoch": 8.2,
+      "learning_rate": 1.0481853593572226e-05,
+      "loss": 0.3184,
+      "step": 481500
+    },
+    {
+      "epoch": 8.2,
+      "learning_rate": 1.0456488209413605e-05,
+      "loss": 0.3185,
+      "step": 482000
+    },
+    {
+      "epoch": 8.21,
+      "learning_rate": 1.0431757673006884e-05,
+      "loss": 0.3184,
+      "step": 482500
+    },
+    {
+      "epoch": 8.22,
+      "learning_rate": 1.0407713747066088e-05,
+      "loss": 0.3184,
+      "step": 483000
+    },
+    {
+      "epoch": 8.23,
+      "learning_rate": 1.038435666889507e-05,
+      "loss": 0.3186,
+      "step": 483500
+    },
+    {
+      "epoch": 8.24,
+      "learning_rate": 1.036168666901875e-05,
+      "loss": 0.3183,
+      "step": 484000
+    },
+    {
+      "epoch": 8.25,
+      "learning_rate": 1.0339747250503798e-05,
+      "loss": 0.3185,
+      "step": 484500
+    },
+    {
+      "epoch": 8.26,
+      "learning_rate": 1.0318450696414725e-05,
+      "loss": 0.3186,
+      "step": 485000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d212205555a22147e8aebc90c2a3779922ada08fea6366382eebbae33ef7733
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ccac6cfd193e438464e5b6e186f7cfb7a9fd45fac4373893748d8948cac56c4
 size 201355195