training completed[dev]: 512 128

Browse files

Files changed (4) hide show

README.md +18 -18
all_results.json +6 -6
runs/Apr06_01-17-41_b7d2b20d960d/events.out.tfevents.1712366264.b7d2b20d960d.1095.0 +2 -2
test_results.json +6 -6

README.md CHANGED Viewed

@@ -19,9 +19,9 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.1785
-- Rouge1: 0.6772
-- Rouge2: 0.4105
-- Rougel: 0.6161
 - Rougelsum: 0.6161
 - Wer: 0.4869
 - Bleurt: 0.3779
@@ -56,21 +56,21 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer    | Bleurt |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
-| No log        | 0.13  | 250  | 1.3316          | 0.6509 | 0.3768 | 0.5866 | 0.5865    | 0.5217 | 0.3009 |
-| 1.7919        | 0.27  | 500  | 1.2776          | 0.6593 | 0.3865 | 0.5962 | 0.5962    | 0.5108 | 0.3009 |
-| 1.7919        | 0.4   | 750  | 1.2513          | 0.6633 | 0.3931 | 0.6015 | 0.6014    | 0.5039 | 0.3009 |
-| 1.3552        | 0.53  | 1000 | 1.2326          | 0.6667 | 0.3967 | 0.6048 | 0.6047    | 0.5008 | 0.3009 |
-| 1.3552        | 0.66  | 1250 | 1.2236          | 0.669  | 0.4    | 0.6072 | 0.6072    | 0.4972 | 0.3314 |
-| 1.3074        | 0.8   | 1500 | 1.2118          | 0.6711 | 0.4022 | 0.6093 | 0.6093    | 0.4953 | 0.3314 |
-| 1.3074        | 0.93  | 1750 | 1.2022          | 0.6714 | 0.4034 | 0.6105 | 0.6104    | 0.4932 | 0.2798 |
-| 1.3037        | 1.06  | 2000 | 1.1972          | 0.673  | 0.4053 | 0.6117 | 0.6116    | 0.4916 | 0.3771 |
-| 1.3037        | 1.2   | 2250 | 1.1909          | 0.6749 | 0.4068 | 0.6136 | 0.6135    | 0.4905 | 0.3314 |
-| 1.2676        | 1.33  | 2500 | 1.1889          | 0.676  | 0.4086 | 0.6143 | 0.6143    | 0.4893 | 0.3314 |
-| 1.2676        | 1.46  | 2750 | 1.1848          | 0.6763 | 0.4091 | 0.615  | 0.6149    | 0.4884 | 0.3314 |
-| 1.2796        | 1.6   | 3000 | 1.1829          | 0.677  | 0.4095 | 0.6154 | 0.6154    | 0.488  | 0.3123 |
-| 1.2796        | 1.73  | 3250 | 1.1808          | 0.6767 | 0.41   | 0.6157 | 0.6157    | 0.4876 | 0.3779 |
-| 1.2489        | 1.86  | 3500 | 1.1787          | 0.6771 | 0.4105 | 0.616  | 0.616     | 0.4869 | 0.3771 |
-| 1.2489        | 1.99  | 3750 | 1.1785          | 0.6772 | 0.4105 | 0.6161 | 0.6161    | 0.4869 | 0.3779 |
 ### Framework versions

 This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.1785
+- Rouge1: 0.6774
+- Rouge2: 0.4106
+- Rougel: 0.6163
 - Rougelsum: 0.6161
 - Wer: 0.4869
 - Bleurt: 0.3779
 | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer    | Bleurt |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
+| No log        | 0.13  | 250  | 1.3316          | 0.6511 | 0.3769 | 0.5868 | 0.5866    | 0.5217 | 0.3009 |
+| 1.7919        | 0.27  | 500  | 1.2776          | 0.6595 | 0.3866 | 0.5964 | 0.5962    | 0.5108 | 0.3009 |
+| 1.7919        | 0.4   | 750  | 1.2513          | 0.6635 | 0.3932 | 0.6016 | 0.6014    | 0.5039 | 0.3009 |
+| 1.3552        | 0.53  | 1000 | 1.2326          | 0.6668 | 0.3968 | 0.605  | 0.6048    | 0.5008 | 0.3009 |
+| 1.3552        | 0.66  | 1250 | 1.2236          | 0.6692 | 0.4    | 0.6073 | 0.6072    | 0.4972 | 0.3314 |
+| 1.3074        | 0.8   | 1500 | 1.2118          | 0.6713 | 0.4023 | 0.6094 | 0.6093    | 0.4953 | 0.3314 |
+| 1.3074        | 0.93  | 1750 | 1.2022          | 0.6716 | 0.4035 | 0.6106 | 0.6105    | 0.4932 | 0.2798 |
+| 1.3037        | 1.06  | 2000 | 1.1972          | 0.6731 | 0.4053 | 0.6118 | 0.6117    | 0.4916 | 0.3771 |
+| 1.3037        | 1.2   | 2250 | 1.1909          | 0.675  | 0.4069 | 0.6136 | 0.6135    | 0.4905 | 0.3314 |
+| 1.2676        | 1.33  | 2500 | 1.1889          | 0.6761 | 0.4087 | 0.6144 | 0.6143    | 0.4893 | 0.3314 |
+| 1.2676        | 1.46  | 2750 | 1.1848          | 0.6764 | 0.4091 | 0.6151 | 0.615     | 0.4884 | 0.3314 |
+| 1.2796        | 1.6   | 3000 | 1.1829          | 0.6771 | 0.4096 | 0.6156 | 0.6154    | 0.488  | 0.3123 |
+| 1.2796        | 1.73  | 3250 | 1.1808          | 0.6769 | 0.4101 | 0.6159 | 0.6158    | 0.4876 | 0.3779 |
+| 1.2489        | 1.86  | 3500 | 1.1787          | 0.6772 | 0.4106 | 0.6162 | 0.6161    | 0.4869 | 0.3771 |
+| 1.2489        | 1.99  | 3750 | 1.1785          | 0.6774 | 0.4106 | 0.6163 | 0.6161    | 0.4869 | 0.3779 |
 ### Framework versions

all_results.json CHANGED Viewed

@@ -3,10 +3,10 @@
     "test_WER": 0.4816,
     "test_loss": 1.195426344871521,
     "test_rouge1": 0.6827,
-    "test_rouge2": 0.4184,
-    "test_rougeL": 0.6228,
-    "test_rougeLsum": 0.6222,
-    "test_runtime": 31.0979,
-    "test_samples_per_second": 12.123,
-    "test_steps_per_second": 2.026
 }

     "test_WER": 0.4816,
     "test_loss": 1.195426344871521,
     "test_rouge1": 0.6827,
+    "test_rouge2": 0.419,
+    "test_rougeL": 0.6225,
+    "test_rougeLsum": 0.6227,
+    "test_runtime": 42.9332,
+    "test_samples_per_second": 8.781,
+    "test_steps_per_second": 1.467
 }

runs/Apr06_01-17-41_b7d2b20d960d/events.out.tfevents.1712366264.b7d2b20d960d.1095.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04db99cb387add81f24da4967b2a7b03a5e37075d0309ef7d8c5c429700eb8bb
-size 13689

 version https://git-lfs.github.com/spec/v1
+oid sha256:aa459e6ae38a9886eba484d6131d7ff20d70d1a3ce2569c59c7ad757726e2104
+size 15967

test_results.json CHANGED Viewed

@@ -3,10 +3,10 @@
     "test_WER": 0.4816,
     "test_loss": 1.195426344871521,
     "test_rouge1": 0.6827,
-    "test_rouge2": 0.4184,
-    "test_rougeL": 0.6228,
-    "test_rougeLsum": 0.6222,
-    "test_runtime": 31.0979,
-    "test_samples_per_second": 12.123,
-    "test_steps_per_second": 2.026
 }

     "test_WER": 0.4816,
     "test_loss": 1.195426344871521,
     "test_rouge1": 0.6827,
+    "test_rouge2": 0.419,
+    "test_rougeL": 0.6225,
+    "test_rougeLsum": 0.6227,
+    "test_runtime": 42.9332,
+    "test_samples_per_second": 8.781,
+    "test_steps_per_second": 1.467
 }