End of training

Files changed (8) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 1.0,
-    "train_loss": 8.709332525719078e-05,
-    "train_runtime": 189.6957,
-    "train_samples": 21538,
-    "train_samples_per_second": 113.54,
-    "train_steps_per_second": 1.777
 }

 {
     "epoch": 1.0,
+    "train_loss": 0.009268463998593412,
+    "train_runtime": 186.2906,
+    "train_samples": 21673,
+    "train_samples_per_second": 116.34,
+    "train_steps_per_second": 1.82
 }

config.json CHANGED Viewed

@@ -51,7 +51,7 @@
     }
   },
   "torch_dtype": "float32",
-  "transformers_version": "4.12.0.dev0",
   "use_cache": true,
   "vocab_size": 32100
 }

     }
   },
   "torch_dtype": "float32",
+  "transformers_version": "4.12.5",
   "use_cache": true,
   "vocab_size": 32100
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6557f7e7707f045eb67eed0b29690171c23fbd92515f5215c978de1af11d2103
 size 891650871

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff4db044f0e2ae34edf783091398f37420df1649eae1f2f0ffaca225f65b7be0
 size 891650871

runs/Nov25_17-40-02_DESKTOP-FPB11SM/1637858565.932426/events.out.tfevents.1637858565.DESKTOP-FPB11SM.22208.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:85f1deba7e0f7476bd25e4b4ac66f543e2ad61febb47dc088bb6f411249f2b16
+size 4740

runs/Nov25_17-40-02_DESKTOP-FPB11SM/events.out.tfevents.1637858565.DESKTOP-FPB11SM.22208.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e9c8127b7bfe608f84667fe18518eea026745ab8c2dc025506fe71a7628370d
+size 5321

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 1.0,
-    "train_loss": 8.709332525719078e-05,
-    "train_runtime": 189.6957,
-    "train_samples": 21538,
-    "train_samples_per_second": 113.54,
-    "train_steps_per_second": 1.777
 }

 {
     "epoch": 1.0,
+    "train_loss": 0.009268463998593412,
+    "train_runtime": 186.2906,
+    "train_samples": 21673,
+    "train_samples_per_second": 116.34,
+    "train_steps_per_second": 1.82
 }

trainer_state.json CHANGED Viewed

@@ -2,60 +2,60 @@
   "best_metric": null,
   "best_model_checkpoint": null,
   "epoch": 1.0,
-  "global_step": 337,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 0.15,
-      "learning_rate": 4.258160237388724e-05,
-      "loss": 0.0002,
       "step": 50
     },
     {
-      "epoch": 0.3,
-      "learning_rate": 3.516320474777448e-05,
-      "loss": 0.0002,
       "step": 100
     },
     {
-      "epoch": 0.45,
-      "learning_rate": 2.774480712166172e-05,
-      "loss": 0.0,
       "step": 150
     },
     {
       "epoch": 0.59,
-      "learning_rate": 2.0326409495548962e-05,
-      "loss": 0.0001,
       "step": 200
     },
     {
       "epoch": 0.74,
-      "learning_rate": 1.29080118694362e-05,
-      "loss": 0.0,
       "step": 250
     },
     {
-      "epoch": 0.89,
-      "learning_rate": 5.489614243323442e-06,
-      "loss": 0.0,
       "step": 300
     },
     {
       "epoch": 1.0,
-      "step": 337,
-      "total_flos": 2801087359488000.0,
-      "train_loss": 8.709332525719078e-05,
-      "train_runtime": 189.6957,
-      "train_samples_per_second": 113.54,
-      "train_steps_per_second": 1.777
     }
   ],
-  "max_steps": 337,
   "num_train_epochs": 1,
-  "total_flos": 2801087359488000.0,
   "trial_name": null,
   "trial_params": null
 }

   "best_metric": null,
   "best_model_checkpoint": null,
   "epoch": 1.0,
+  "global_step": 339,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 0.15,
+      "learning_rate": 4.262536873156342e-05,
+      "loss": 0.0544,
       "step": 50
     },
     {
+      "epoch": 0.29,
+      "learning_rate": 3.5250737463126844e-05,
+      "loss": 0.0046,
       "step": 100
     },
     {
+      "epoch": 0.44,
+      "learning_rate": 2.7876106194690264e-05,
+      "loss": 0.0017,
       "step": 150
     },
     {
       "epoch": 0.59,
+      "learning_rate": 2.0501474926253688e-05,
+      "loss": 0.0008,
       "step": 200
     },
     {
       "epoch": 0.74,
+      "learning_rate": 1.3126843657817109e-05,
+      "loss": 0.0003,
       "step": 250
     },
     {
+      "epoch": 0.88,
+      "learning_rate": 5.752212389380531e-06,
+      "loss": 0.0005,
       "step": 300
     },
     {
       "epoch": 1.0,
+      "step": 339,
+      "total_flos": 2741653307243520.0,
+      "train_loss": 0.009268463998593412,
+      "train_runtime": 186.2906,
+      "train_samples_per_second": 116.34,
+      "train_steps_per_second": 1.82
     }
   ],
+  "max_steps": 339,
   "num_train_epochs": 1,
+  "total_flos": 2741653307243520.0,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bb7add8ff853cd2132d39756e4551133929cae92cc5bcd1c7db0103a7b3d00e1
 size 2991

 version https://git-lfs.github.com/spec/v1
+oid sha256:b331deea65e8e800146e5b236d9284b85aec2aeed33a1d4d1f8096aa29f4c51a
 size 2991