Training in progress, step 99000

Files changed (10) hide show

.gitattributes CHANGED Viewed

@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+log.txt filter=lfs diff=lfs merge=lfs -text

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f883377702d8f113630455e79f29afa5de1ed623717f6ed0d55128bca09cdac6
 size 538943941

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb6e7c33c0689e6c3298ded6c7a90382868146c4308e6c82b556a0111b8b1259
 size 538943941

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:103ae63eb15642bd84b830bf18d49ff1e4734c3ae7b347dcb11f41f4c2740c49
 size 269468281

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5eb3d7defb1c32bd6fc4a21ab99f020092d22e7be3eb53044a485f9035ce1b7
 size 269468281

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9cceeaef5cadb9f75354fe0dc0f06f637f72402bdbf35192020c853cf8173ab4
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:f8326297abcf2a1908b1a767fe60d17987a26f2c5604b81b26fa14b663ae5bff
 size 14575

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc177a0f1f66d3affc300ca46f0c523e126a8424d299076516cb8961cc272a5a
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:da692e8a61b0469d66a05ee87d5569d6a98e9a4d9ac49ff837bd9b7979d7ad48
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06d129a7a9141688975b2505e1d057ad3fdb45901890c70149479744954d70eb
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:eed58ddd784a948e5c48af7e5967f7f6677bd7d9091292c0e7d8f98ed90e5eb2
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": 1.4165735244750977,
   "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/tiny/checkpoint-98500",
-  "epoch": 10.980976168828228,
-  "global_step": 98500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -2764,11 +2764,25 @@
       "eval_samples_per_second": 298.894,
       "eval_steps_per_second": 37.375,
       "step": 98500
     }
   ],
   "max_steps": 134550,
   "num_train_epochs": 15,
-  "total_flos": 6.828350028986436e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": 1.4165735244750977,
   "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/tiny/checkpoint-98500",
+  "epoch": 11.03678660633106,
+  "global_step": 99000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 298.894,
       "eval_steps_per_second": 37.375,
       "step": 98500
+    },
+    {
+      "epoch": 11.04,
+      "learning_rate": 2.6448903753251582e-05,
+      "loss": 1.4601,
+      "step": 99000
+    },
+    {
+      "epoch": 11.04,
+      "eval_loss": 1.421845555305481,
+      "eval_runtime": 35.8769,
+      "eval_samples_per_second": 320.317,
+      "eval_steps_per_second": 40.054,
+      "step": 99000
     }
   ],
   "max_steps": 134550,
   "num_train_epochs": 15,
+  "total_flos": 6.863007182432229e+17,
   "trial_name": null,
   "trial_params": null
 }

log.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:103ae63eb15642bd84b830bf18d49ff1e4734c3ae7b347dcb11f41f4c2740c49
 size 269468281

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5eb3d7defb1c32bd6fc4a21ab99f020092d22e7be3eb53044a485f9035ce1b7
 size 269468281

runs/Jan19_18-25-54_turing/events.out.tfevents.1674149167.turing.482470.1 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c0f5f5d74aa6bc3a1ff3d46b669ef08cc675b7200a30e3680728954a8ce07510
-size 89549

 version https://git-lfs.github.com/spec/v1
+oid sha256:5ac6e242fb32701c2853e60a0c367c9fdb56bc17ee59cc3d3f6a344a8a448fea
+size 89985