Training in progress, step 12200

Browse files

Files changed (11) hide show

{checkpoint-11600 → checkpoint-12200}/config.json +0 -0
{checkpoint-11600 → checkpoint-12200}/optimizer.pt +1 -1
{checkpoint-11600 → checkpoint-12200}/preprocessor_config.json +0 -0
{checkpoint-11600 → checkpoint-12200}/pytorch_model.bin +1 -1
{checkpoint-11600 → checkpoint-12200}/rng_state.pth +2 -2
{checkpoint-11600 → checkpoint-12200}/scaler.pt +1 -1
{checkpoint-11600 → checkpoint-12200}/scheduler.pt +1 -1
{checkpoint-11600 → checkpoint-12200}/trainer_state.json +75 -3
{checkpoint-11600 → checkpoint-12200}/training_args.bin +0 -0
pytorch_model.bin +1 -1
runs/Feb29_06-40-12_88ba3e3089b0/events.out.tfevents.1709188854.88ba3e3089b0.584.0 +2 -2

{checkpoint-11600 → checkpoint-12200}/config.json RENAMED Viewed

File without changes

{checkpoint-11600 → checkpoint-12200}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba9ebd2cb340a71369a53abe1497f25128c8aabf9d1330dc4084498a66707958
 size 330501178

 version https://git-lfs.github.com/spec/v1
+oid sha256:bc515a01e9e2331272e2688ab26d150060ee5b4d18b46a5039892b1fe7a60bc9
 size 330501178

{checkpoint-11600 → checkpoint-12200}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-11600 → checkpoint-12200}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f6be8a1e7c46e218316192ae1521c8cc3fea19e48bea7a4413093de0babd368f
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f3d6ecb7d0de9b755ff2254f0b23a59bdebac0f0720a7a7f6bf6137dda88820
 size 166628834

{checkpoint-11600 → checkpoint-12200}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1bbe03c165858e427bf1690c78aca8d29770dca019e5d87ae12c45ed31926031
-size 14180

 version https://git-lfs.github.com/spec/v1
+oid sha256:4035ceaade5bbf92f1d33853f1f79f9f758c53575371225b56f7833007fbb057
+size 14308

{checkpoint-11600 → checkpoint-12200}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9eef046ab22a76d8c7502f6eed706ed994dc76c1182ca7dc0096a858466626b
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:8de62983e80550d154137c9abb3ad8c5a0b825753ca3b5128cd86472366c6609
 size 988

{checkpoint-11600 → checkpoint-12200}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eae3e6dc44dcb169f3179fa7f6c9297649ce7525dbcd15721ef74297edd0ca3d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:442fd94f442ef422e03ea26344ef677e888ff84597c1ac6626f845997b27ddfb
 size 1064

{checkpoint-11600 → checkpoint-12200}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.2040661219836597,
-  "global_step": 11600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1398,11 +1398,83 @@
       "learning_rate": 7.798593957818735e-06,
       "loss": 0.9419,
       "step": 11600
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
-  "total_flos": 4.434980288707584e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.3180695420862625,
+  "global_step": 12200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 7.798593957818735e-06,
       "loss": 0.9419,
       "step": 11600
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 7.789093672810185e-06,
+      "loss": 0.9078,
+      "step": 11650
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 7.779593387801634e-06,
+      "loss": 0.9313,
+      "step": 11700
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 7.770093102793086e-06,
+      "loss": 0.9452,
+      "step": 11750
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 7.760592817784535e-06,
+      "loss": 0.9401,
+      "step": 11800
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 7.751092532775983e-06,
+      "loss": 0.9278,
+      "step": 11850
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 7.741592247767434e-06,
+      "loss": 0.931,
+      "step": 11900
+    },
+    {
+      "epoch": 2.27,
+      "learning_rate": 7.732091962758883e-06,
+      "loss": 0.9436,
+      "step": 11950
+    },
+    {
+      "epoch": 2.28,
+      "learning_rate": 7.722591677750333e-06,
+      "loss": 0.9212,
+      "step": 12000
+    },
+    {
+      "epoch": 2.29,
+      "learning_rate": 7.713091392741782e-06,
+      "loss": 0.95,
+      "step": 12050
+    },
+    {
+      "epoch": 2.3,
+      "learning_rate": 7.703591107733232e-06,
+      "loss": 0.9701,
+      "step": 12100
+    },
+    {
+      "epoch": 2.31,
+      "learning_rate": 7.694090822724683e-06,
+      "loss": 0.9402,
+      "step": 12150
+    },
+    {
+      "epoch": 2.32,
+      "learning_rate": 7.684590537716132e-06,
+      "loss": 0.9419,
+      "step": 12200
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
+  "total_flos": 4.664385709046784e+19,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-11600 → checkpoint-12200}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce7ead05fff3caa3b7b28d20216da8399f0f8d3c59ad03f41369e9196756b69b
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f3d6ecb7d0de9b755ff2254f0b23a59bdebac0f0720a7a7f6bf6137dda88820
 size 166628834

runs/Feb29_06-40-12_88ba3e3089b0/events.out.tfevents.1709188854.88ba3e3089b0.584.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3b34a889cd4bdc6538d73ca2cc4228cd65651810682322161e9a1861284cfe5
-size 42815

 version https://git-lfs.github.com/spec/v1
+oid sha256:1fa5e17d1caff09ce99c86d4fe4fc1855344e39766bd7effb3b06b7eec178394
+size 43443