Training in progress, step 13800

Browse files

Files changed (11) hide show

{checkpoint-13200 → checkpoint-13800}/config.json +0 -0
{checkpoint-13200 → checkpoint-13800}/optimizer.pt +1 -1
{checkpoint-13200 → checkpoint-13800}/preprocessor_config.json +0 -0
{checkpoint-13200 → checkpoint-13800}/pytorch_model.bin +1 -1
{checkpoint-13200 → checkpoint-13800}/rng_state.pth +1 -1
{checkpoint-13200 → checkpoint-13800}/scaler.pt +1 -1
{checkpoint-13200 → checkpoint-13800}/scheduler.pt +1 -1
{checkpoint-13200 → checkpoint-13800}/trainer_state.json +75 -3
{checkpoint-13200 → checkpoint-13800}/training_args.bin +0 -0
pytorch_model.bin +1 -1
runs/Feb29_13-56-06_3a0664c7c2dd/events.out.tfevents.1709215109.3a0664c7c2dd.2321.0 +2 -2

{checkpoint-13200 → checkpoint-13800}/config.json RENAMED Viewed

File without changes

{checkpoint-13200 → checkpoint-13800}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef36ca8c8c70233abc7a8cee6a5d1a0555740766ca04707bae03e3f0c580c5f7
 size 330501178

 version https://git-lfs.github.com/spec/v1
+oid sha256:914978b2a4788b287da0c998e5aacef46d279ce11afef35e802cfb5b777a0f5f
 size 330501178

{checkpoint-13200 → checkpoint-13800}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-13200 → checkpoint-13800}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a603da01c74d9504c35845be6ee4365c2df4b2bd1c14a68b036545f8b9bfe0cf
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:3843b02ee5ae11c37ff2887d62bb97a97af3189ee614e15e6c71c023fa806df5
 size 166628834

{checkpoint-13200 → checkpoint-13800}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:baeb722c7eb9df4195b8f19894482c730fd38333b5ab545d6c278f67dba1e795
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:d593abced29e6f34e3600625cf827fd4591fcf821bb4f9bff7add8ae91e99077
 size 14244

{checkpoint-13200 → checkpoint-13800}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a14aac3f1a42a5643173abb85e00e68e78f46b63a124973b1fb9b5013022b7a
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ee1413e1cf9c272323ce5f4dece3c6a0e346bfd0db69d70c75a91f9fbae55f4
 size 988

{checkpoint-13200 → checkpoint-13800}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:811bdd1945539ce0d69d353e2dedff42b36763d7e95bd7d48ace3a36632e96c8
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb1b01715c4d4978b8bd9921ee2051456f9f8e18431463aed7053a7c4d3d0170
 size 1064

{checkpoint-13200 → checkpoint-13800}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.508075242257268,
-  "global_step": 13200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1590,11 +1590,83 @@
       "learning_rate": 7.494584837545127e-06,
       "loss": 0.9041,
       "step": 13200
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
-  "total_flos": 5.046728076278784e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.6220786623598706,
+  "global_step": 13800,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 7.494584837545127e-06,
       "loss": 0.9041,
       "step": 13200
+    },
+    {
+      "epoch": 2.52,
+      "learning_rate": 7.485274558236748e-06,
+      "loss": 0.9399,
+      "step": 13250
+    },
+    {
+      "epoch": 2.53,
+      "learning_rate": 7.475774273228198e-06,
+      "loss": 0.9176,
+      "step": 13300
+    },
+    {
+      "epoch": 2.54,
+      "learning_rate": 7.466273988219647e-06,
+      "loss": 0.9235,
+      "step": 13350
+    },
+    {
+      "epoch": 2.55,
+      "learning_rate": 7.456773703211096e-06,
+      "loss": 0.8947,
+      "step": 13400
+    },
+    {
+      "epoch": 2.56,
+      "learning_rate": 7.4472734182025465e-06,
+      "loss": 0.9205,
+      "step": 13450
+    },
+    {
+      "epoch": 2.57,
+      "learning_rate": 7.437773133193996e-06,
+      "loss": 0.9188,
+      "step": 13500
+    },
+    {
+      "epoch": 2.57,
+      "learning_rate": 7.428272848185446e-06,
+      "loss": 0.9285,
+      "step": 13550
+    },
+    {
+      "epoch": 2.58,
+      "learning_rate": 7.418772563176896e-06,
+      "loss": 0.93,
+      "step": 13600
+    },
+    {
+      "epoch": 2.59,
+      "learning_rate": 7.409272278168346e-06,
+      "loss": 0.9355,
+      "step": 13650
+    },
+    {
+      "epoch": 2.6,
+      "learning_rate": 7.3997719931597955e-06,
+      "loss": 0.9297,
+      "step": 13700
+    },
+    {
+      "epoch": 2.61,
+      "learning_rate": 7.390271708151245e-06,
+      "loss": 0.9037,
+      "step": 13750
+    },
+    {
+      "epoch": 2.62,
+      "learning_rate": 7.380771423142695e-06,
+      "loss": 0.9066,
+      "step": 13800
     }
   ],
   "max_steps": 52630,
   "num_train_epochs": 10,
+  "total_flos": 5.276133496617984e+19,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-13200 → checkpoint-13800}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d4989b2d7f4cae57b5a3aa1cf86e415ff5b1965edd161d195369354348da688
 size 166628834

 version https://git-lfs.github.com/spec/v1
+oid sha256:3843b02ee5ae11c37ff2887d62bb97a97af3189ee614e15e6c71c023fa806df5
 size 166628834

runs/Feb29_13-56-06_3a0664c7c2dd/events.out.tfevents.1709215109.3a0664c7c2dd.2321.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c1d5debafc9304f7db453dcd62a7183edc61c47e61bd1ddedd70eef86531d738
-size 9537

 version https://git-lfs.github.com/spec/v1
+oid sha256:5420ea52b1a60c7d79aba070b7a3c2d00dbef6cff73689c11e602a6ead721e49
+size 10165