Training in progress, step 500

Browse files

Files changed (10) hide show

{checkpoint-200 → checkpoint-500}/config.json +0 -0
{checkpoint-200 → checkpoint-500}/optimizer.pt +2 -2
{checkpoint-200 → checkpoint-500}/preprocessor_config.json +0 -0
{checkpoint-200 → checkpoint-500}/pytorch_model.bin +1 -1
{checkpoint-200 → checkpoint-500}/rng_state.pth +1 -1
{checkpoint-200 → checkpoint-500}/scaler.pt +1 -1
{checkpoint-200 → checkpoint-500}/scheduler.pt +1 -1
{checkpoint-200 → checkpoint-500}/trainer_state.json +120 -3
{checkpoint-200 → checkpoint-500}/training_args.bin +0 -0
pytorch_model.bin +1 -1

{checkpoint-200 → checkpoint-500}/config.json RENAMED Viewed

File without changes

{checkpoint-200 → checkpoint-500}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e372713b9b4f08bb894dc870270602df8edb42a297b076384214416e48da7427
-size 2490337361

 version https://git-lfs.github.com/spec/v1
+oid sha256:048f968ba8a4f235f039cc2a3b8618f0d55f48973016df5fcaae601d0b92d784
+size 2490337809

{checkpoint-200 → checkpoint-500}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-200 → checkpoint-500}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fea7f958b25952352273031565944d92f86ac710ce0e0b4b61eb74f30d1f78ad
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:70e8ab1267a52eb4fa82e60a245e4f97d45dfb9f9c4616b7da2a301c9311b7f7
 size 1262063089

{checkpoint-200 → checkpoint-500}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e76fe309ed364f4a44a74766da4dcfb7b318850c8c7c327fc5f82d79d192a224
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:158b5fc43024b846c58cb1ec5967d7e3d1635ecc454a7b9dd1aac7d9ccc8d61e
 size 14503

{checkpoint-200 → checkpoint-500}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81203995f0822de6ed51d600e94d6f7d40cd4741b0f277d950b37bbc13d4b61e
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:1c304e72bfea7592d4ddcc6e3b3b1a9bcab2965ed75957d798b3560c75dbe7d8
 size 559

{checkpoint-200 → checkpoint-500}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:de2bc386c3cff1fb864afc8ef94f3bbbfa6c62de3df077be5c634acc882bc912
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f844f4edb8fac739b919057d71649ad3c5a779b3699b7f57247e1a115c338a4
 size 623

{checkpoint-200 → checkpoint-500}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.09204924634679554,
-  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -84,11 +84,128 @@
       "eval_steps_per_second": 0.781,
       "eval_wer": 1.0,
       "step": 200
     }
   ],
   "max_steps": 6516,
   "num_train_epochs": 3,
-  "total_flos": 3.810397715849134e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.23012311586698883,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.781,
       "eval_wer": 1.0,
       "step": 200
+    },
+    {
+      "epoch": 0.1,
+      "learning_rate": 7.403680501174628e-05,
+      "loss": 3.1517,
+      "step": 220
+    },
+    {
+      "epoch": 0.11,
+      "learning_rate": 7.380187940485512e-05,
+      "loss": 3.1617,
+      "step": 240
+    },
+    {
+      "epoch": 0.12,
+      "learning_rate": 7.357870007830852e-05,
+      "loss": 3.2971,
+      "step": 260
+    },
+    {
+      "epoch": 0.13,
+      "learning_rate": 7.334377447141738e-05,
+      "loss": 3.022,
+      "step": 280
+    },
+    {
+      "epoch": 0.14,
+      "learning_rate": 7.312059514487078e-05,
+      "loss": 3.3322,
+      "step": 300
+    },
+    {
+      "epoch": 0.14,
+      "eval_loss": 3.0716073513031006,
+      "eval_runtime": 196.1674,
+      "eval_samples_per_second": 24.688,
+      "eval_steps_per_second": 0.775,
+      "eval_wer": 1.0,
+      "step": 300
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 7.288566953797964e-05,
+      "loss": 2.9964,
+      "step": 320
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 7.265074393108849e-05,
+      "loss": 3.0777,
+      "step": 340
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 7.242756460454189e-05,
+      "loss": 3.2703,
+      "step": 360
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 7.219263899765073e-05,
+      "loss": 3.1161,
+      "step": 380
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 7.195771339075958e-05,
+      "loss": 3.2435,
+      "step": 400
+    },
+    {
+      "epoch": 0.18,
+      "eval_loss": 3.063333034515381,
+      "eval_runtime": 190.5938,
+      "eval_samples_per_second": 25.41,
+      "eval_steps_per_second": 0.798,
+      "eval_wer": 1.0,
+      "step": 400
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 7.172278778386843e-05,
+      "loss": 2.9993,
+      "step": 420
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 7.148786217697727e-05,
+      "loss": 3.0555,
+      "step": 440
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 7.126468285043069e-05,
+      "loss": 3.1879,
+      "step": 460
+    },
+    {
+      "epoch": 0.22,
+      "learning_rate": 7.102975724353953e-05,
+      "loss": 2.9861,
+      "step": 480
+    },
+    {
+      "epoch": 0.23,
+      "learning_rate": 7.080657791699295e-05,
+      "loss": 3.0833,
+      "step": 500
+    },
+    {
+      "epoch": 0.23,
+      "eval_loss": 2.9769718647003174,
+      "eval_runtime": 195.2639,
+      "eval_samples_per_second": 24.802,
+      "eval_steps_per_second": 0.778,
+      "eval_wer": 1.0,
+      "step": 500
     }
   ],
   "max_steps": 6516,
   "num_train_epochs": 3,
+  "total_flos": 9.523798230150083e+18,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-200 → checkpoint-500}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61b6883c6e02239e2f9a600d8b7a77e2e4821e4fd6b9635280a33cee15944b9e
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:70e8ab1267a52eb4fa82e60a245e4f97d45dfb9f9c4616b7da2a301c9311b7f7
 size 1262063089