Training in progress, step 24000

Files changed (11) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2c879f385b422df3fca5228513f3bae4387ed9e62fd092ebca498251ff96dd82
 size 3871543575

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9436f8f8b607b1ee593a8f3b0b8b83e30fe390053f20fd17d06fad5fa1c3800
 size 3871543575

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:24a7fb993881a603ce7c7932d42c04cd7697ed7fbc569bff9d0a019e4b731376
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a6ca84a97e8c4a7948040e06ceceb51817c0b2cbd17f232026f4dbe0b459e8f
 size 1944201353

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fdfd1692f8c3e07bd7f0386306b8a4dc7984bed19ffb5f1fb77db39dc898e24a
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:6d8f258a77a5626bb48a10d9b85a8386b171d5dd6f4cd303281f19063ab68e5f
 size 14575

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2a64456a544b4e3b448418c8f8b53a190245445274955bebd8d3b8522bf98ccb
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:f431083eeb6d9fc00bf62f51e90febacbb78f3e6a99dc9fc4278d2be5a055df8
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7240fa7db242cb3d6601e7b6ac5c0a2f2bebee276959a658a3c866c5e8a6d292
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:b4a6d62e8eba1babe503704efa95eb56e2c5e9222374877c14b70b7d65166a96
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.5242683834708665,
-  "global_step": 20000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -246,11 +246,59 @@
       "learning_rate": 2.3109751299304977e-05,
       "loss": 1.41,
       "step": 20000
     }
   ],
   "max_steps": 38148,
   "num_train_epochs": 1,
-  "total_flos": 2.203967601635328e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.6291220601650397,
+  "global_step": 24000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.3109751299304977e-05,
       "loss": 1.41,
       "step": 20000
+    },
+    {
+      "epoch": 0.54,
+      "learning_rate": 2.208518091776931e-05,
+      "loss": 1.3994,
+      "step": 20500
+    },
+    {
+      "epoch": 0.55,
+      "learning_rate": 2.1065551895687553e-05,
+      "loss": 1.402,
+      "step": 21000
+    },
+    {
+      "epoch": 0.56,
+      "learning_rate": 2.0054610881655616e-05,
+      "loss": 1.3803,
+      "step": 21500
+    },
+    {
+      "epoch": 0.58,
+      "learning_rate": 1.9050020383592233e-05,
+      "loss": 1.396,
+      "step": 22000
+    },
+    {
+      "epoch": 0.59,
+      "learning_rate": 1.8055516613795243e-05,
+      "loss": 1.3896,
+      "step": 22500
+    },
+    {
+      "epoch": 0.6,
+      "learning_rate": 1.707278550901278e-05,
+      "loss": 1.3721,
+      "step": 23000
+    },
+    {
+      "epoch": 0.62,
+      "learning_rate": 1.610349304833249e-05,
+      "loss": 1.3559,
+      "step": 23500
+    },
+    {
+      "epoch": 0.63,
+      "learning_rate": 1.5149282428923398e-05,
+      "loss": 1.3745,
+      "step": 24000
     }
   ],
   "max_steps": 38148,
   "num_train_epochs": 1,
+  "total_flos": 2.6437433869983744e+16,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a91745d5c34dd898b0980ec93cf90caddb5b2af7b8791e7a7000ac13519890d
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:199b3c969edf26c24dbc136ed11ffce7b4ba6fca136ae73bf4ac87b279d10612
 size 3771

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:24a7fb993881a603ce7c7932d42c04cd7697ed7fbc569bff9d0a019e4b731376
 size 1944201353

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a6ca84a97e8c4a7948040e06ceceb51817c0b2cbd17f232026f4dbe0b459e8f
 size 1944201353

runs/Jun18_17-52-03_85d30a282e1b/1687112276.514311/events.out.tfevents.1687112276.85d30a282e1b.283.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc065b4819b65fbe0c37ed9ed822a534caee708e5201bd6110c8792e73e3fc0f
+size 6187

runs/Jun18_17-52-03_85d30a282e1b/events.out.tfevents.1687112276.85d30a282e1b.283.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e58edc503b7e7e09ead300ec65b6ae8e84d0206ee2b89ccb7ed0d3fed326b214
+size 5742

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a91745d5c34dd898b0980ec93cf90caddb5b2af7b8791e7a7000ac13519890d
 size 3771

 version https://git-lfs.github.com/spec/v1
+oid sha256:199b3c969edf26c24dbc136ed11ffce7b4ba6fca136ae73bf4ac87b279d10612
 size 3771