Training in progress, step 200000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d137545299ce280839e9660375b0a7ab0faec41723ba68a4216914563feac59d
 size 885325017

 version https://git-lfs.github.com/spec/v1
+oid sha256:43a71e6151adca0181a848ed657b48274701ef87b47b5ef99efa5a58e418e0b9
 size 885325017

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e7cb21fe7014a2339ef03eb26bae39f944da008eab2b1e49e39c28a524fe382
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:910f4d508b15f4d31159848b7d06b89055f204cf1403cbe37a1a3dbba55627c2
 size 442675755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b930a1e8f69335ea9febebb5f89a57eab0a63cf76bf0d2e207317b0797c1fd8
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2db3ae320a2425a1ef9765c539e85b9ac3e18026db96f43f936e94820322ff1
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04ad030a150fa0d8eb5e5920300951e9645dc85319159f9dd4f177aff4c5b722
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:be1ccf49f4804619cd7d22b74b595a694a368e629a10492b4089d6536d07bdf2
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.003958,
-  "global_step": 150000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -930,11 +930,319 @@
       "eval_samples_per_second": 476.755,
       "eval_steps_per_second": 3.814,
       "step": 150000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 2.5268224249225544e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.053958,
+  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 476.755,
       "eval_steps_per_second": 3.814,
       "step": 150000
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 9.723691552302562e-05,
+      "loss": 0.8529,
+      "step": 151000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.718245238567939e-05,
+      "loss": 0.7213,
+      "step": 152000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.712747326859315e-05,
+      "loss": 0.7083,
+      "step": 153000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.707197877300974e-05,
+      "loss": 0.8147,
+      "step": 154000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.701596950580806e-05,
+      "loss": 0.874,
+      "step": 155000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.695944607949649e-05,
+      "loss": 0.8637,
+      "step": 156000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.690240911220618e-05,
+      "loss": 0.7201,
+      "step": 157000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.684485922768422e-05,
+      "loss": 0.6845,
+      "step": 158000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.6786797055287e-05,
+      "loss": 0.8199,
+      "step": 159000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.672822322997305e-05,
+      "loss": 0.872,
+      "step": 160000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 9.66691383922964e-05,
+      "loss": 0.8647,
+      "step": 161000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.660954318839933e-05,
+      "loss": 0.6884,
+      "step": 162000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.654943827000548e-05,
+      "loss": 0.7121,
+      "step": 163000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.648882429441257e-05,
+      "loss": 0.8052,
+      "step": 164000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.642770192448536e-05,
+      "loss": 0.8746,
+      "step": 165000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.636607182864827e-05,
+      "loss": 0.8377,
+      "step": 166000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.630393468087818e-05,
+      "loss": 0.7194,
+      "step": 167000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.624129116069694e-05,
+      "loss": 0.7,
+      "step": 168000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.617814195316411e-05,
+      "loss": 0.8013,
+      "step": 169000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.611448774886924e-05,
+      "loss": 0.8651,
+      "step": 170000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 9.605032924392457e-05,
+      "loss": 0.8531,
+      "step": 171000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.598566713995718e-05,
+      "loss": 0.7139,
+      "step": 172000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.59205021441015e-05,
+      "loss": 0.682,
+      "step": 173000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.58548349689915e-05,
+      "loss": 0.8036,
+      "step": 174000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.578866633275288e-05,
+      "loss": 0.8639,
+      "step": 175000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.572199695899522e-05,
+      "loss": 0.8518,
+      "step": 176000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.565482757680415e-05,
+      "loss": 0.686,
+      "step": 177000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.558715892073323e-05,
+      "loss": 0.7089,
+      "step": 178000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.551899173079607e-05,
+      "loss": 0.7906,
+      "step": 179000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.545032675245813e-05,
+      "loss": 0.8673,
+      "step": 180000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 9.538116473662861e-05,
+      "loss": 0.8238,
+      "step": 181000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.531150643965223e-05,
+      "loss": 0.7204,
+      "step": 182000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.524135262330098e-05,
+      "loss": 0.6934,
+      "step": 183000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.517070405476575e-05,
+      "loss": 0.7844,
+      "step": 184000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.509956150664796e-05,
+      "loss": 0.8557,
+      "step": 185000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.502792575695112e-05,
+      "loss": 0.845,
+      "step": 186000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.49557975890723e-05,
+      "loss": 0.712,
+      "step": 187000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.488317779179361e-05,
+      "loss": 0.6772,
+      "step": 188000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.481006715927351e-05,
+      "loss": 0.7856,
+      "step": 189000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.473646649103818e-05,
+      "loss": 0.8578,
+      "step": 190000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.46623765919727e-05,
+      "loss": 0.8401,
+      "step": 191000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.458779827231237e-05,
+      "loss": 0.6855,
+      "step": 192000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.451273234763371e-05,
+      "loss": 0.7043,
+      "step": 193000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.443717963884569e-05,
+      "loss": 0.7758,
+      "step": 194000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.43611409721806e-05,
+      "loss": 0.8624,
+      "step": 195000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.428461717918511e-05,
+      "loss": 0.8132,
+      "step": 196000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.420760909671118e-05,
+      "loss": 0.7198,
+      "step": 197000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.413011756690685e-05,
+      "loss": 0.6865,
+      "step": 198000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.405214343720707e-05,
+      "loss": 0.7701,
+      "step": 199000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 9.397368756032445e-05,
+      "loss": 0.847,
+      "step": 200000
+    },
+    {
+      "epoch": 1.05,
+      "eval_loss": 0.5953904390335083,
+      "eval_runtime": 10.2072,
+      "eval_samples_per_second": 489.853,
+      "eval_steps_per_second": 3.919,
+      "step": 200000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 3.3690923552137544e+18,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e7cb21fe7014a2339ef03eb26bae39f944da008eab2b1e49e39c28a524fe382
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:910f4d508b15f4d31159848b7d06b89055f204cf1403cbe37a1a3dbba55627c2
 size 442675755

runs/Dec27_23-39-04_t1v-n-6071ee6f-w-0/events.out.tfevents.1672184365.t1v-n-6071ee6f-w-0.108001.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f249865bf547d027f4d3894cc616ba1f1d077c80f07039ba19c5ac201f5519c
-size 28561

 version https://git-lfs.github.com/spec/v1
+oid sha256:a61f7b04d7b7dbb2f80530083396fff89007d8e29ecbe2e0bd1c6fb0f35f9180
+size 36837