Training in progress, step 1000000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Nov28_12-08-26_t1v-n-7cb529b4-w-0/events.out.tfevents.1669637379.t1v-n-7cb529b4-w-0.2625564.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f96d8734fc67059a7520a3a1a9d2a55a3e6d098043a6c6cd90a1b6f91f56d860
 size 2841350745

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e9cfc0cf0e4ebfef38df44339a78495c871dc4fdb1b15bf66baf5551245fcab
 size 2841350745

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c039c129759ed5638ee7f9058c69171bd7245d4934386b8e9f5f3d9e2f97c3f5
 size 1420697771

 version https://git-lfs.github.com/spec/v1
+oid sha256:c0a529311e7b73b1544a6d34e823d88935fc28967cab28dfe3641c41ef9d9245
 size 1420697771

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d905a073e26a85b5b79ade0d20d3463a694fd12691c67edaafb418c1aa37ae21
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:8033b5759c03f0fdee51e437a0c23c3a85f9badbcb2e5f68cd55e6d2383e5577
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39eec6df7074d0a0eeedc59f33d9f00406ad61372a26441a57b7bb31d11113c8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ba26c1d82afce467f99f1dd703268570999f7477616467ac56e429a68fb1d41
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39eec6df7074d0a0eeedc59f33d9f00406ad61372a26441a57b7bb31d11113c8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ba26c1d82afce467f99f1dd703268570999f7477616467ac56e429a68fb1d41
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d905a073e26a85b5b79ade0d20d3463a694fd12691c67edaafb418c1aa37ae21
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:8033b5759c03f0fdee51e437a0c23c3a85f9badbcb2e5f68cd55e6d2383e5577
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e0f01b76b5b2a9fe316619f2bfc48a18372e61d5c4e211addfae83ec24a7913
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:831d0b332f86a08639c5540d922d6f7f898fe0e329f753536e820fa510124211
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39eec6df7074d0a0eeedc59f33d9f00406ad61372a26441a57b7bb31d11113c8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ba26c1d82afce467f99f1dd703268570999f7477616467ac56e429a68fb1d41
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d905a073e26a85b5b79ade0d20d3463a694fd12691c67edaafb418c1aa37ae21
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:8033b5759c03f0fdee51e437a0c23c3a85f9badbcb2e5f68cd55e6d2383e5577
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e0f01b76b5b2a9fe316619f2bfc48a18372e61d5c4e211addfae83ec24a7913
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:831d0b332f86a08639c5540d922d6f7f898fe0e329f753536e820fa510124211
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc2c2c8416f63b11e9c82d6dac05baa6ad73177ac658621e099b23ff71f2f801
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:906bc3ed48818cc1785b6a98c1e064532a322520b99cdf458cfd827674d9b7ec
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.415955,
-  "global_step": 950000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5858,11 +5858,319 @@
       "eval_samples_per_second": 254.526,
       "eval_steps_per_second": 3.996,
       "step": 950000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 2.8335390155073257e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.4659550000000001,
+  "global_step": 1000000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 254.526,
       "eval_steps_per_second": 3.996,
       "step": 950000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 6.549893279788277e-07,
+      "loss": 0.7946,
+      "step": 951000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 6.285834552247128e-07,
+      "loss": 0.8071,
+      "step": 952000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 6.027175003719354e-07,
+      "loss": 0.8073,
+      "step": 953000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 5.773917462864264e-07,
+      "loss": 0.8005,
+      "step": 954000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 5.526064699265753e-07,
+      "loss": 0.8143,
+      "step": 955000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 5.283619423401998e-07,
+      "loss": 0.8085,
+      "step": 956000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 5.046584286615697e-07,
+      "loss": 0.8065,
+      "step": 957000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 4.814961881085045e-07,
+      "loss": 0.7965,
+      "step": 958000
+    },
+    {
+      "epoch": 1.42,
+      "learning_rate": 4.5887547397955864e-07,
+      "loss": 0.7935,
+      "step": 959000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 4.367965336512403e-07,
+      "loss": 0.8058,
+      "step": 960000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 4.1525960857530243e-07,
+      "loss": 0.8087,
+      "step": 961000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 3.9426493427611177e-07,
+      "loss": 0.8059,
+      "step": 962000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 3.738127403480507e-07,
+      "loss": 0.8112,
+      "step": 963000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 3.5390325045304706e-07,
+      "loss": 0.8136,
+      "step": 964000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 3.3453668231809286e-07,
+      "loss": 0.8115,
+      "step": 965000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 3.157132477328628e-07,
+      "loss": 0.7955,
+      "step": 966000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 2.9743315254743833e-07,
+      "loss": 0.8069,
+      "step": 967000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 2.796965966699927e-07,
+      "loss": 0.8109,
+      "step": 968000
+    },
+    {
+      "epoch": 1.43,
+      "learning_rate": 2.625037740646763e-07,
+      "loss": 0.8081,
+      "step": 969000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 2.458548727494292e-07,
+      "loss": 0.8169,
+      "step": 970000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 2.2975007479397738e-07,
+      "loss": 0.8193,
+      "step": 971000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 2.1418955631781202e-07,
+      "loss": 0.8084,
+      "step": 972000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.9917348748826335e-07,
+      "loss": 0.7984,
+      "step": 973000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.847020325186577e-07,
+      "loss": 0.7909,
+      "step": 974000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.7077534966650766e-07,
+      "loss": 0.7789,
+      "step": 975000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.5739359123178587e-07,
+      "loss": 0.8053,
+      "step": 976000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.4455690355525964e-07,
+      "loss": 0.8,
+      "step": 977000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.3226542701689215e-07,
+      "loss": 0.7943,
+      "step": 978000
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 1.2051929603428825e-07,
+      "loss": 0.7907,
+      "step": 979000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 1.0931863906127327e-07,
+      "loss": 0.7951,
+      "step": 980000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 9.866357858642205e-08,
+      "loss": 0.798,
+      "step": 981000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 8.855423113177664e-08,
+      "loss": 0.8057,
+      "step": 982000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 7.899070725153613e-08,
+      "loss": 0.7998,
+      "step": 983000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 6.997311153086883e-08,
+      "loss": 0.7946,
+      "step": 984000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 6.150154258476315e-08,
+      "loss": 0.8003,
+      "step": 985000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 5.3576093056922906e-08,
+      "loss": 0.8032,
+      "step": 986000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 4.619684961881254e-08,
+      "loss": 0.7832,
+      "step": 987000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 3.936389296864129e-08,
+      "loss": 0.7957,
+      "step": 988000
+    },
+    {
+      "epoch": 1.45,
+      "learning_rate": 3.3077297830541584e-08,
+      "loss": 0.8173,
+      "step": 989000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 2.7337132953697554e-08,
+      "loss": 0.804,
+      "step": 990000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 2.214346111164556e-08,
+      "loss": 0.7921,
+      "step": 991000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 1.749633910153592e-08,
+      "loss": 0.8102,
+      "step": 992000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 1.3395817743561134e-08,
+      "loss": 0.8074,
+      "step": 993000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 9.841941880361916e-09,
+      "loss": 0.7963,
+      "step": 994000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 6.834750376549792e-09,
+      "loss": 0.8013,
+      "step": 995000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 4.3742761183018784e-09,
+      "loss": 0.8027,
+      "step": 996000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 2.4605460129556445e-09,
+      "loss": 0.8073,
+      "step": 997000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 1.0935809887702154e-09,
+      "loss": 0.8076,
+      "step": 998000
+    },
+    {
+      "epoch": 1.46,
+      "learning_rate": 2.7339599464326627e-10,
+      "loss": 0.8206,
+      "step": 999000
+    },
+    {
+      "epoch": 1.47,
+      "learning_rate": 0.0,
+      "loss": 0.8031,
+      "step": 1000000
+    },
+    {
+      "epoch": 1.47,
+      "eval_loss": 0.6313675045967102,
+      "eval_runtime": 39.6188,
+      "eval_samples_per_second": 252.405,
+      "eval_steps_per_second": 3.963,
+      "step": 1000000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 2.9826726086567657e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c039c129759ed5638ee7f9058c69171bd7245d4934386b8e9f5f3d9e2f97c3f5
 size 1420697771

 version https://git-lfs.github.com/spec/v1
+oid sha256:c0a529311e7b73b1544a6d34e823d88935fc28967cab28dfe3641c41ef9d9245
 size 1420697771

runs/Nov28_12-08-26_t1v-n-7cb529b4-w-0/events.out.tfevents.1669637379.t1v-n-7cb529b4-w-0.2625564.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:493fc665d441f15fde8f94763d18c8118b77659275454b81f3579d6c942c6aed
-size 69942

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5f35d161162d9608ce252e1359e6edf6ab56d695e1627810f9dd07c69d886f5
+size 78218