Training in progress, step 77336

Browse files

Files changed (8) hide show

last-checkpoint/generation_config.json +1 -0
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +144 -3
pytorch_model.bin +1 -1
runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 +2 -2

last-checkpoint/generation_config.json CHANGED Viewed

@@ -2,6 +2,7 @@
   "_from_model_config": true,
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
   "transformers_version": "4.26.0"
 }

   "_from_model_config": true,
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
+  "max_length": 300,
   "pad_token_id": 0,
   "transformers_version": "4.26.0"
 }

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f2992361efcf4770d4c6602bb67d93320a187287e7fc6dc44519cbf03c5dd8d1
 size 2401461637

 version https://git-lfs.github.com/spec/v1
+oid sha256:6df0004473716224f08e7366a4b13550fc06f34aec0352a5c2d2d7d5164597a3
 size 2401461637

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4071ac5bc82e1943cce385333b946af39ce630c568c0ddebfc504245d7448e1
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:87b0bb2564b2dab9e02aac0e077c1e06181afd486b00577a15c4a5029f68ed7c
 size 1200739717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e52dd293318f93d0d24ab2680c6a46204bbcb9dee0ba0954189329cd5f7d5e2e
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1c41e482802bc97fdd0ddd478f81f890ac7879380e8dd605815c3f44c2761cf
 size 14575

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c0312d2c26f50db24e7fa24aa7f3be59f0d2b84dcf88829a4f490d4d99de93a
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:60fdcc494b0281edea8ff71092a9259fd16c44c328d0dafd2fc4eb4dda344861
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9861057391925263,
-  "global_step": 66288,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -798,11 +798,152 @@
       "learning_rate": 1.3454523816607659e-05,
       "loss": 3.013,
       "step": 66000
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
-  "total_flos": 7.793968305851597e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.150456695724614,
+  "global_step": 77336,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.3454523816607659e-05,
       "loss": 3.013,
       "step": 66000
+    },
+    {
+      "epoch": 0.99,
+      "learning_rate": 1.3404936875824384e-05,
+      "loss": 3.0027,
+      "step": 66500
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 1.3355349935041108e-05,
+      "loss": 3.0155,
+      "step": 67000
+    },
+    {
+      "epoch": 1.0,
+      "eval_bleu": 11.298551127218651,
+      "eval_loss": 2.3749005794525146,
+      "eval_runtime": 4929.9601,
+      "eval_samples_per_second": 8.201,
+      "eval_steps_per_second": 0.513,
+      "step": 67222
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 1.3305762994257834e-05,
+      "loss": 3.0195,
+      "step": 67500
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 1.3256176053474558e-05,
+      "loss": 2.9924,
+      "step": 68000
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 1.3206589112691284e-05,
+      "loss": 2.997,
+      "step": 68500
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 1.3157002171908007e-05,
+      "loss": 2.9694,
+      "step": 69000
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 1.3107415231124732e-05,
+      "loss": 2.9804,
+      "step": 69500
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 1.3057828290341456e-05,
+      "loss": 2.9879,
+      "step": 70000
+    },
+    {
+      "epoch": 1.05,
+      "learning_rate": 1.3008241349558182e-05,
+      "loss": 2.9919,
+      "step": 70500
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 1.2958654408774906e-05,
+      "loss": 2.9875,
+      "step": 71000
+    },
+    {
+      "epoch": 1.06,
+      "learning_rate": 1.2909067467991632e-05,
+      "loss": 2.9912,
+      "step": 71500
+    },
+    {
+      "epoch": 1.07,
+      "learning_rate": 1.2859480527208354e-05,
+      "loss": 2.974,
+      "step": 72000
+    },
+    {
+      "epoch": 1.08,
+      "learning_rate": 1.280989358642508e-05,
+      "loss": 2.9581,
+      "step": 72500
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 1.2760306645641804e-05,
+      "loss": 2.975,
+      "step": 73000
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 1.271071970485853e-05,
+      "loss": 2.9737,
+      "step": 73500
+    },
+    {
+      "epoch": 1.1,
+      "learning_rate": 1.2661132764075254e-05,
+      "loss": 2.9722,
+      "step": 74000
+    },
+    {
+      "epoch": 1.11,
+      "learning_rate": 1.261154582329198e-05,
+      "loss": 2.9727,
+      "step": 74500
+    },
+    {
+      "epoch": 1.12,
+      "learning_rate": 1.2561958882508702e-05,
+      "loss": 2.9618,
+      "step": 75000
+    },
+    {
+      "epoch": 1.12,
+      "learning_rate": 1.2512371941725428e-05,
+      "loss": 2.9554,
+      "step": 75500
+    },
+    {
+      "epoch": 1.13,
+      "learning_rate": 1.2462785000942152e-05,
+      "loss": 2.961,
+      "step": 76000
+    },
+    {
+      "epoch": 1.14,
+      "learning_rate": 1.2413198060158878e-05,
+      "loss": 2.9627,
+      "step": 76500
+    },
+    {
+      "epoch": 1.15,
+      "learning_rate": 1.2363611119375602e-05,
+      "loss": 2.9896,
+      "step": 77000
     }
   ],
   "max_steps": 201666,
   "num_train_epochs": 3,
+  "total_flos": 9.093214173619814e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4071ac5bc82e1943cce385333b946af39ce630c568c0ddebfc504245d7448e1
 size 1200739717

 version https://git-lfs.github.com/spec/v1
+oid sha256:87b0bb2564b2dab9e02aac0e077c1e06181afd486b00577a15c4a5029f68ed7c
 size 1200739717

runs/Feb07_05-04-07_5214b674e698/events.out.tfevents.1675746342.5214b674e698.342.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:16d94d99a4243783f2c4751209b7f4a0753cff0f06dbbcb869acc91381ecb224
-size 25141

 version https://git-lfs.github.com/spec/v1
+oid sha256:643354f90e73662cc3dab47e0d1c8ae7366fff16e187d6ca8273a9b221c47a70
+size 28986