Training in progress, step 12000

Browse files

Files changed (11) hide show

{checkpoint-11400 → checkpoint-12000}/config.json +0 -0
{checkpoint-11400 → checkpoint-12000}/optimizer.pt +1 -1
{checkpoint-11400 → checkpoint-12000}/preprocessor_config.json +0 -0
{checkpoint-11400 → checkpoint-12000}/pytorch_model.bin +1 -1
{checkpoint-11400 → checkpoint-12000}/rng_state.pth +2 -2
{checkpoint-11400 → checkpoint-12000}/scaler.pt +1 -1
{checkpoint-11400 → checkpoint-12000}/scheduler.pt +1 -1
{checkpoint-11400 → checkpoint-12000}/trainer_state.json +75 -3
{checkpoint-11400 → checkpoint-12000}/training_args.bin +0 -0
pytorch_model.bin +1 -1
runs/Feb29_06-40-12_88ba3e3089b0/events.out.tfevents.1709188854.88ba3e3089b0.584.0 +2 -2

{checkpoint-11400 → checkpoint-12000}/config.json RENAMED Viewed

File without changes

{checkpoint-11400 → checkpoint-12000}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:51059b9f784869f50dd486eb75789ff1100313039cd9915ccdc24d02f4a54362
 size 330501178

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e394c8c5d4f935ff0aee7a185e6aa2e5c3eafb4ec593dfda34f42f03cf70a38
 size 330501178

{checkpoint-11400 → checkpoint-12000}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-11400 → checkpoint-12000}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7548a6ca2f5ae4a311faa32c37a23c748dfe15d36185ec0c99e9131ccf462a42
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce7ead05fff3caa3b7b28d20216da8399f0f8d3c59ad03f41369e9196756b69b
 size 166628834

{checkpoint-11400 → checkpoint-12000}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e6d15c9ab1a39bc9cbeba851393001f0b83f94fa83870124e670ed5ce08dfb59
-size 14180

 version https://git-lfs.github.com/spec/v1
+oid sha256:42099ca80a2827f586e2cd0357b4bc186e31647613412ebe9b9139558b0086db
+size 14244

{checkpoint-11400 → checkpoint-12000}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bac664126ce3c5e13e744c139ee130c846e9a0d1d9dc5ca209b2be886e743fce
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:901ccc6b629ca31f80d8fcc7094c82ebb007876337324efbc24cfb3fffb68ca6
 size 988

{checkpoint-11400 → checkpoint-12000}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2a7082b2db3c89cb9935a0d0e0d465ce412b06cd4a642b4dd7a786feb67e5376
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:efe7bb4cfa76efc67c49531c06369642b1628cfa905abd33637961592c6799ba
 size 1064

{checkpoint-11400 → checkpoint-12000}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.1660649819494586,
-  "global_step": 11400,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1374,11 +1374,83 @@
       "learning_rate": 7.836595097852936e-06,
       "loss": 0.9605,
       "step": 11400
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
-  "total_flos": 4.358511815261184e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.2800684020520614,
+  "global_step": 12000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 7.836595097852936e-06,
       "loss": 0.9605,
       "step": 11400
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 7.827094812844385e-06,
+      "loss": 0.9283,
+      "step": 11450
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 7.817594527835835e-06,
+      "loss": 0.9115,
+      "step": 11500
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 7.808094242827286e-06,
+      "loss": 0.9508,
+      "step": 11550
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 7.798593957818735e-06,
+      "loss": 0.9419,
+      "step": 11600
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 7.789093672810185e-06,
+      "loss": 0.9078,
+      "step": 11650
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 7.779593387801634e-06,
+      "loss": 0.9313,
+      "step": 11700
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 7.770093102793086e-06,
+      "loss": 0.9452,
+      "step": 11750
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 7.760592817784535e-06,
+      "loss": 0.9401,
+      "step": 11800
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 7.751092532775983e-06,
+      "loss": 0.9278,
+      "step": 11850
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 7.741592247767434e-06,
+      "loss": 0.931,
+      "step": 11900
+    },
+    {
+      "epoch": 2.27,
+      "learning_rate": 7.732091962758883e-06,
+      "loss": 0.9436,
+      "step": 11950
+    },
+    {
+      "epoch": 2.28,
+      "learning_rate": 7.722591677750333e-06,
+      "loss": 0.9212,
+      "step": 12000
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
+  "total_flos": 4.587917235600384e+19,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-11400 → checkpoint-12000}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:941f644e8d17ec96d3c53c66b204f2d746989d17f3afd50aef4a79442ed41cb8
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce7ead05fff3caa3b7b28d20216da8399f0f8d3c59ad03f41369e9196756b69b
 size 166628834

runs/Feb29_06-40-12_88ba3e3089b0/events.out.tfevents.1709188854.88ba3e3089b0.584.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba88144b93f482dc63e502f528b19a12f86253af64663b386b0894fbeb13610b
-size 42187

 version https://git-lfs.github.com/spec/v1
+oid sha256:d3b34a889cd4bdc6538d73ca2cc4228cd65651810682322161e9a1861284cfe5
+size 42815