joelniklaus committed on
Commit
181083f
Parent: 317d36a

Training in progress, step 850000

last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:396f7233851d0252630541cbdc3f45391c08c17bdbff96436a76285b6d19be4c
+ oid sha256:08f951759775273acca27a12ea950a11bbfb4e3e81edcf7e13a2e38e65ad7d75
  size 885325017
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:247d11956ffd5e5b235ed7c5dc3217f08d97dab23bcfcd7bacfd90be0849a0b4
+ oid sha256:164a1a0c14af3ddfe09b60b80146afabdba18c1085ddf41902e33cae32b815cd
  size 442675755
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:73dd12a1067d4f7e0c1b9f55d05f7b43980d4da15b85e60a9ba59576295646d4
+ oid sha256:39f2e58dacfd68a9f8da2b5898b22122b823c7de2a9055616202e36287f328f4
  size 13611
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:50e51b9224ded3ddffee57f26ec45414409de0232579ddafb7f3e083076fa4c5
+ oid sha256:adedebe0cc7e07de957a9e2967d6e9c3934a9fdca3245f46a29d125e5e36192e
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
  {
  "best_metric": null,
  "best_model_checkpoint": null,
- "epoch": 5.06979,
- "global_step": 800000,
+ "epoch": 5.11979,
+ "global_step": 850000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
@@ -4934,11 +4934,319 @@
  "eval_samples_per_second": 347.766,
  "eval_steps_per_second": 2.782,
  "step": 800000
+ },
+ {
+ "epoch": 5.07,
+ "learning_rate": 1.0441632244932237e-05,
+ "loss": 0.618,
+ "step": 801000
+ },
+ {
+ "epoch": 5.07,
+ "learning_rate": 1.0340722563656107e-05,
+ "loss": 0.5785,
+ "step": 802000
+ },
+ {
+ "epoch": 5.07,
+ "learning_rate": 1.0240246589884044e-05,
+ "loss": 0.6103,
+ "step": 803000
+ },
+ {
+ "epoch": 5.07,
+ "learning_rate": 1.0140205422405214e-05,
+ "loss": 0.7324,
+ "step": 804000
+ },
+ {
+ "epoch": 5.07,
+ "learning_rate": 1.0040600155253765e-05,
+ "loss": 0.7056,
+ "step": 805000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.941431877696955e-06,
+ "loss": 0.6092,
+ "step": 806000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.842701674223187e-06,
+ "loss": 0.5889,
+ "step": 807000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.744410624530148e-06,
+ "loss": 0.6145,
+ "step": 808000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.646559803512994e-06,
+ "loss": 0.7272,
+ "step": 809000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.549150281252633e-06,
+ "loss": 0.6878,
+ "step": 810000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.452183123004e-06,
+ "loss": 0.6375,
+ "step": 811000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.355659389184396e-06,
+ "loss": 0.5797,
+ "step": 812000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.259580135361929e-06,
+ "loss": 0.6181,
+ "step": 813000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.163946412243896e-06,
+ "loss": 0.7022,
+ "step": 814000
+ },
+ {
+ "epoch": 5.08,
+ "learning_rate": 9.068759265665384e-06,
+ "loss": 0.7195,
+ "step": 815000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.974019736577777e-06,
+ "loss": 0.6206,
+ "step": 816000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.879728861037384e-06,
+ "loss": 0.5827,
+ "step": 817000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.785887670194138e-06,
+ "loss": 0.5984,
+ "step": 818000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.692497190280224e-06,
+ "loss": 0.7331,
+ "step": 819000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.599558442598998e-06,
+ "loss": 0.701,
+ "step": 820000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.507072443513702e-06,
+ "loss": 0.6137,
+ "step": 821000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.415040204436426e-06,
+ "loss": 0.5866,
+ "step": 822000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.323462731816961e-06,
+ "loss": 0.6116,
+ "step": 823000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.232341027131885e-06,
+ "loss": 0.7246,
+ "step": 824000
+ },
+ {
+ "epoch": 5.09,
+ "learning_rate": 8.141676086873572e-06,
+ "loss": 0.6898,
+ "step": 825000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 8.051468902539272e-06,
+ "loss": 0.639,
+ "step": 826000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.96172046062032e-06,
+ "loss": 0.582,
+ "step": 827000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.872431742591268e-06,
+ "loss": 0.6104,
+ "step": 828000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.783603724899257e-06,
+ "loss": 0.7017,
+ "step": 829000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.695237378953223e-06,
+ "loss": 0.7198,
+ "step": 830000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.607333671113409e-06,
+ "loss": 0.6212,
+ "step": 831000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.519893562680663e-06,
+ "loss": 0.5858,
+ "step": 832000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.432918009885997e-06,
+ "loss": 0.5894,
+ "step": 833000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.3464079638801365e-06,
+ "loss": 0.7322,
+ "step": 834000
+ },
+ {
+ "epoch": 5.1,
+ "learning_rate": 7.260364370723044e-06,
+ "loss": 0.6982,
+ "step": 835000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 7.174788171373731e-06,
+ "loss": 0.6199,
+ "step": 836000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 7.089680301679752e-06,
+ "loss": 0.5853,
+ "step": 837000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 7.005041692367154e-06,
+ "loss": 0.6058,
+ "step": 838000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.92087326903022e-06,
+ "loss": 0.7226,
+ "step": 839000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.837175952121306e-06,
+ "loss": 0.6915,
+ "step": 840000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.753950656940905e-06,
+ "loss": 0.6411,
+ "step": 841000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.671198293627479e-06,
+ "loss": 0.5828,
+ "step": 842000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.588919767147639e-06,
+ "loss": 0.6022,
+ "step": 843000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.5071159772861436e-06,
+ "loss": 0.7013,
+ "step": 844000
+ },
+ {
+ "epoch": 5.11,
+ "learning_rate": 6.425787818636131e-06,
+ "loss": 0.7207,
+ "step": 845000
+ },
+ {
+ "epoch": 5.12,
+ "learning_rate": 6.344936180589351e-06,
+ "loss": 0.6242,
+ "step": 846000
+ },
+ {
+ "epoch": 5.12,
+ "learning_rate": 6.264561947326331e-06,
+ "loss": 0.5877,
+ "step": 847000
+ },
+ {
+ "epoch": 5.12,
+ "learning_rate": 6.184665997806832e-06,
+ "loss": 0.5805,
+ "step": 848000
+ },
+ {
+ "epoch": 5.12,
+ "learning_rate": 6.1052492057601275e-06,
+ "loss": 0.7306,
+ "step": 849000
+ },
+ {
+ "epoch": 5.12,
+ "learning_rate": 6.026312439675552e-06,
+ "loss": 0.6988,
+ "step": 850000
+ },
+ {
+ "epoch": 5.12,
+ "eval_loss": 0.4753837287425995,
+ "eval_runtime": 10.2925,
+ "eval_samples_per_second": 485.791,
+ "eval_steps_per_second": 3.886,
+ "step": 850000
  }
  ],
  "max_steps": 1000000,
  "num_train_epochs": 9223372036854775807,
- "total_flos": 1.3476382054903972e+19,
+ "total_flos": 1.4318651985195172e+19,
  "trial_name": null,
  "trial_params": null
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:247d11956ffd5e5b235ed7c5dc3217f08d97dab23bcfcd7bacfd90be0849a0b4
+ oid sha256:164a1a0c14af3ddfe09b60b80146afabdba18c1085ddf41902e33cae32b815cd
  size 442675755
runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:aed0691fe9a810a5e9cc3ca8fa6afcdfb5800ccd5417271908269435cadc88ea
- size 136149
+ oid sha256:e52cdc8630d544095f08a1e0936e12cfe05b25bfc9effb63eb623b39cfd3cf76
+ size 144425