End of training

Files changed (5) hide show

README.md CHANGED Viewed

@@ -1,13 +1,34 @@
 ---
 license: apache-2.0
 base_model: bert-base-cased
 tags:
 - generated_from_trainer
 datasets:
 - glue
 model-index:
 - name: push-to-hub-test-2
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,7 +36,12 @@ should probably proofread and complete it, then remove this comment. -->
 # push-to-hub-test-2
-This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on the glue dataset.
 ## Model description

 ---
+language:
+- en
 license: apache-2.0
 base_model: bert-base-cased
 tags:
 - generated_from_trainer
 datasets:
 - glue
+metrics:
+- accuracy
+- f1
 model-index:
 - name: push-to-hub-test-2
+  results:
+  - task:
+      name: Text Classification
+      type: text-classification
+    dataset:
+      name: GLUE MRPC
+      type: glue
+      config: mrpc
+      split: validation
+      args: mrpc
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 0.8676470588235294
+    - name: F1
+      type: f1
+      value: 0.9078498293515359
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
 # push-to-hub-test-2
+This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on the GLUE MRPC dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.6255
+- Accuracy: 0.8676
+- F1: 0.9078
+- Combined Score: 0.8877
 ## Model description

all_results.json CHANGED Viewed

@@ -4,13 +4,13 @@
     "eval_combined_score": 0.8877484440875327,
     "eval_f1": 0.9078498293515359,
     "eval_loss": 0.6254646182060242,
-    "eval_runtime": 0.9668,
     "eval_samples": 408,
-    "eval_samples_per_second": 422.028,
-    "eval_steps_per_second": 26.894,
     "train_loss": 0.29736072982566947,
-    "train_runtime": 72.3445,
     "train_samples": 3668,
-    "train_samples_per_second": 152.106,
-    "train_steps_per_second": 9.538
 }

     "eval_combined_score": 0.8877484440875327,
     "eval_f1": 0.9078498293515359,
     "eval_loss": 0.6254646182060242,
+    "eval_runtime": 0.9827,
     "eval_samples": 408,
+    "eval_samples_per_second": 415.192,
+    "eval_steps_per_second": 26.458,
     "train_loss": 0.29736072982566947,
+    "train_runtime": 69.9797,
     "train_samples": 3668,
+    "train_samples_per_second": 157.246,
+    "train_steps_per_second": 9.86
 }

eval_results.json CHANGED Viewed

@@ -4,8 +4,8 @@
     "eval_combined_score": 0.8877484440875327,
     "eval_f1": 0.9078498293515359,
     "eval_loss": 0.6254646182060242,
-    "eval_runtime": 0.9668,
     "eval_samples": 408,
-    "eval_samples_per_second": 422.028,
-    "eval_steps_per_second": 26.894
 }

     "eval_combined_score": 0.8877484440875327,
     "eval_f1": 0.9078498293515359,
     "eval_loss": 0.6254646182060242,
+    "eval_runtime": 0.9827,
     "eval_samples": 408,
+    "eval_samples_per_second": 415.192,
+    "eval_steps_per_second": 26.458
 }

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
     "train_loss": 0.29736072982566947,
-    "train_runtime": 72.3445,
     "train_samples": 3668,
-    "train_samples_per_second": 152.106,
-    "train_steps_per_second": 9.538
 }

 {
     "epoch": 3.0,
     "train_loss": 0.29736072982566947,
+    "train_runtime": 69.9797,
     "train_samples": 3668,
+    "train_samples_per_second": 157.246,
+    "train_steps_per_second": 9.86
 }

trainer_state.json CHANGED Viewed

@@ -18,9 +18,9 @@
       "step": 690,
       "total_flos": 723818513295360.0,
       "train_loss": 0.29736072982566947,
-      "train_runtime": 72.3445,
-      "train_samples_per_second": 152.106,
-      "train_steps_per_second": 9.538
     }
   ],
   "max_steps": 690,

       "step": 690,
       "total_flos": 723818513295360.0,
       "train_loss": 0.29736072982566947,
+      "train_runtime": 69.9797,
+      "train_samples_per_second": 157.246,
+      "train_steps_per_second": 9.86
     }
   ],
   "max_steps": 690,