Training in progress, step 500

Browse files

Files changed (10) hide show

{checkpoint-200 → checkpoint-500}/config.json +0 -0
{checkpoint-200 → checkpoint-500}/optimizer.pt +2 -2
{checkpoint-200 → checkpoint-500}/preprocessor_config.json +0 -0
{checkpoint-200 → checkpoint-500}/pytorch_model.bin +1 -1
{checkpoint-200 → checkpoint-500}/rng_state.pth +1 -1
{checkpoint-200 → checkpoint-500}/scaler.pt +1 -1
{checkpoint-200 → checkpoint-500}/scheduler.pt +1 -1
{checkpoint-200 → checkpoint-500}/trainer_state.json +120 -3
{checkpoint-200 → checkpoint-500}/training_args.bin +0 -0
pytorch_model.bin +1 -1

{checkpoint-200 → checkpoint-500}/config.json RENAMED Viewed

File without changes

{checkpoint-200 → checkpoint-500}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a972e696459b016bbc3aa28c954288fe7d65723673c7320476f0145a391b0440
-size 2490337361

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4f451d7dca685dc733896a3b9dde8e1707a70872842fb140a7b1b2bc09dc86e
+size 2490337809

{checkpoint-200 → checkpoint-500}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-200 → checkpoint-500}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3abb902c24b9b514e6979e814143734f3ac477116b25bc616e937ac37aa386b6
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee400442c70fe28b4032830f08f4c31605f74d5b5778895b5f30b7cad432bdcd
 size 1262063089

{checkpoint-200 → checkpoint-500}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:85ca3e1865dd0f1bb02258869eab1dac68ed8a3dc9fd620878973f94cd7d1990
 size 14567

 version https://git-lfs.github.com/spec/v1
+oid sha256:60bd99fb8f131eb1ec63d9b9eee304bd3aa49c3b43a3a12613b8de4c1d42c4c6
 size 14567

{checkpoint-200 → checkpoint-500}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb6982c29cd162f49aeb531674acf574eccd46a8f556bec596040d7c3b95200a
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:4fa4c7be44c959599b8b43bb9bc3371e9e4e5bbc5758b3ab5afcccfda3e72e67
 size 559

{checkpoint-200 → checkpoint-500}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:812e7669c0071d762b7ab2054d1e4ba7a23692696045f03436f670d0f378252b
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:536ace7f76d669d6713c8de85eb8de0ed71bdc66a4ba89707e46295a79ac66a8
 size 623

{checkpoint-200 → checkpoint-500}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.19672131147541,
-  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -84,11 +84,128 @@
       "eval_steps_per_second": 0.79,
       "eval_wer": 1.0,
       "step": 200
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
-  "total_flos": 3.115318423228506e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 5.491803278688525,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.79,
       "eval_wer": 1.0,
       "step": 200
+    },
+    {
+      "epoch": 2.42,
+      "learning_rate": 2.75e-05,
+      "loss": 3.079,
+      "step": 220
+    },
+    {
+      "epoch": 2.63,
+      "learning_rate": 3e-05,
+      "loss": 3.0677,
+      "step": 240
+    },
+    {
+      "epoch": 2.85,
+      "learning_rate": 3.2500000000000004e-05,
+      "loss": 3.0656,
+      "step": 260
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.5000000000000004e-05,
+      "loss": 3.1463,
+      "step": 280
+    },
+    {
+      "epoch": 3.3,
+      "learning_rate": 3.75e-05,
+      "loss": 3.0573,
+      "step": 300
+    },
+    {
+      "epoch": 3.3,
+      "eval_loss": 3.0614514350891113,
+      "eval_runtime": 194.36,
+      "eval_samples_per_second": 24.918,
+      "eval_steps_per_second": 0.782,
+      "eval_wer": 1.0,
+      "step": 300
+    },
+    {
+      "epoch": 3.51,
+      "learning_rate": 4e-05,
+      "loss": 3.0511,
+      "step": 320
+    },
+    {
+      "epoch": 3.73,
+      "learning_rate": 4.25e-05,
+      "loss": 3.0358,
+      "step": 340
+    },
+    {
+      "epoch": 3.95,
+      "learning_rate": 4.4999999999999996e-05,
+      "loss": 3.0416,
+      "step": 360
+    },
+    {
+      "epoch": 4.17,
+      "learning_rate": 4.75e-05,
+      "loss": 3.1053,
+      "step": 380
+    },
+    {
+      "epoch": 4.39,
+      "learning_rate": 5e-05,
+      "loss": 3.0314,
+      "step": 400
+    },
+    {
+      "epoch": 4.39,
+      "eval_loss": 3.0990231037139893,
+      "eval_runtime": 198.3688,
+      "eval_samples_per_second": 24.414,
+      "eval_steps_per_second": 0.766,
+      "eval_wer": 1.0,
+      "step": 400
+    },
+    {
+      "epoch": 4.61,
+      "learning_rate": 5.25e-05,
+      "loss": 3.0309,
+      "step": 420
+    },
+    {
+      "epoch": 4.83,
+      "learning_rate": 5.5e-05,
+      "loss": 3.0259,
+      "step": 440
+    },
+    {
+      "epoch": 5.05,
+      "learning_rate": 5.75e-05,
+      "loss": 3.0998,
+      "step": 460
+    },
+    {
+      "epoch": 5.27,
+      "learning_rate": 6e-05,
+      "loss": 3.0152,
+      "step": 480
+    },
+    {
+      "epoch": 5.49,
+      "learning_rate": 6.25e-05,
+      "loss": 3.0129,
+      "step": 500
+    },
+    {
+      "epoch": 5.49,
+      "eval_loss": 3.039973497390747,
+      "eval_runtime": 190.8567,
+      "eval_samples_per_second": 25.375,
+      "eval_steps_per_second": 0.796,
+      "eval_wer": 1.0,
+      "step": 500
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
+  "total_flos": 7.741689365780442e+18,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-200 → checkpoint-500}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28c7e3ec36d37a20298023cfa6ac730ae02e82d170ef8859ec5740936e2bc809
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee400442c70fe28b4032830f08f4c31605f74d5b5778895b5f30b7cad432bdcd
 size 1262063089