Training in progress, step 385000

Browse files

Files changed (10) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +62 -2
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f8272af4ddd50ac3c03d82b6371903a8e2d3b850546bd45a9f8b94a3453985af
 size 402588883

 version https://git-lfs.github.com/spec/v1
+oid sha256:18de3f7cc4a91ac6868744a9cd20f39edaebacb5665b74cf4f2175021a0edb90
 size 402588883

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28618062dba6742c58cd97862917d0e5cce7292726a4d65b550febad17e88fa8
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7132bd452806a1828ae1699a118b9aa68caeae454b47d624252df8772b23b65
 size 201355195

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5de7856e29d324fe8b2d7a8039c54b4faff384ee2fadaf89719b8ee47b48cf0c
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:53e62c4c1922f2a1587e8d53c73b96e423282fb6d6259d9ca0f71ac25e5e8153
 size 14503

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f0dd029a7e6530ace2ca7d9672c2c2caa1be55bd585e32a5581428856929e03f
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:10f7532403f5b493736d56d3ea7cc99fbf67e90d193efeb30456688505225f32
 size 14503

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57d4b43fb88447123981547f4327ac577192580fb4ced52d9deda508c9b8d482
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4e2f6272d55d9d66dae051add9b1254b4bef8eb2c18fe3b5027696d129a3821
 size 14503

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81980e5ddbb31a0d475d91342667e7ec7c33d09f8b11bc51c09d140f2402de83
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:28a933ecd96bcb0ef9d59cde72c7a2f327911f311001e588d3f029f5f85e1a29
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bcf90e1e79ee4934f7f14472b5dc245979542d20b81316a586ad390ebbd17f9c
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:0634118a00ed086ccf276fc79772adc912101484932dd3c63dd24fd9eb2718ce
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3230a86e29e9aa1af252bbac77fbb562b1bc880e11ef24d2344026ff504c2e85
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:468447bff0f0da8cbb0e93720be4efb28f0be877ee6d17ac6e3f1416931c3f00
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.4680811227138495,
-  "global_step": 380000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4566,6 +4566,66 @@
       "learning_rate": 2.9016777909103095e-05,
       "loss": 0.3207,
       "step": 380000
     }
   ],
   "max_steps": 500000,

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.553186781389095,
+  "global_step": 385000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.9016777909103095e-05,
       "loss": 0.3207,
       "step": 380000
+    },
+    {
+      "epoch": 6.48,
+      "learning_rate": 2.88663409700897e-05,
+      "loss": 0.3209,
+      "step": 380500
+    },
+    {
+      "epoch": 6.49,
+      "learning_rate": 2.8716408699647456e-05,
+      "loss": 0.3207,
+      "step": 381000
+    },
+    {
+      "epoch": 6.49,
+      "learning_rate": 2.85669825775473e-05,
+      "loss": 0.3207,
+      "step": 381500
+    },
+    {
+      "epoch": 6.5,
+      "learning_rate": 2.8418064078564776e-05,
+      "loss": 0.3208,
+      "step": 382000
+    },
+    {
+      "epoch": 6.51,
+      "learning_rate": 2.8269950982228437e-05,
+      "loss": 0.3208,
+      "step": 382500
+    },
+    {
+      "epoch": 6.52,
+      "learning_rate": 2.8122051111179246e-05,
+      "loss": 0.3207,
+      "step": 383000
+    },
+    {
+      "epoch": 6.53,
+      "learning_rate": 2.7974663254541644e-05,
+      "loss": 0.3208,
+      "step": 383500
+    },
+    {
+      "epoch": 6.54,
+      "learning_rate": 2.782778886697424e-05,
+      "loss": 0.3208,
+      "step": 384000
+    },
+    {
+      "epoch": 6.54,
+      "learning_rate": 2.768172160215594e-05,
+      "loss": 0.3205,
+      "step": 384500
+    },
+    {
+      "epoch": 6.55,
+      "learning_rate": 2.753587746225503e-05,
+      "loss": 0.3208,
+      "step": 385000
     }
   ],
   "max_steps": 500000,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28618062dba6742c58cd97862917d0e5cce7292726a4d65b550febad17e88fa8
 size 201355195

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7132bd452806a1828ae1699a118b9aa68caeae454b47d624252df8772b23b65
 size 201355195