jgibb committed on
Commit
d1c362a
1 Parent(s): 26c1a6d

training completed[dev]: 512 128

Browse files
README.md CHANGED
@@ -18,13 +18,13 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.1785
22
- - Rouge1: 0.6774
23
- - Rouge2: 0.4106
24
- - Rougel: 0.6163
25
- - Rougelsum: 0.6162
26
- - Wer: 0.4869
27
- - Bleurt: 0.3779
28
 
29
  ## Model description
30
 
@@ -56,21 +56,20 @@ The following hyperparameters were used during training:
56
 
57
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer | Bleurt |
58
  |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
59
- | No log | 0.13 | 250 | 1.3316 | 0.651 | 0.3769 | 0.5867 | 0.5868 | 0.5217 | 0.3009 |
60
- | 1.7919 | 0.27 | 500 | 1.2776 | 0.6595 | 0.3865 | 0.5963 | 0.5963 | 0.5108 | 0.3009 |
61
- | 1.7919 | 0.4 | 750 | 1.2513 | 0.6635 | 0.393 | 0.6015 | 0.6016 | 0.5039 | 0.3009 |
62
- | 1.3552 | 0.53 | 1000 | 1.2326 | 0.6668 | 0.3967 | 0.6049 | 0.6049 | 0.5008 | 0.3009 |
63
- | 1.3552 | 0.66 | 1250 | 1.2236 | 0.6692 | 0.4 | 0.6073 | 0.6073 | 0.4972 | 0.3314 |
64
- | 1.3074 | 0.8 | 1500 | 1.2118 | 0.6713 | 0.4022 | 0.6094 | 0.6094 | 0.4953 | 0.3314 |
65
- | 1.3074 | 0.93 | 1750 | 1.2022 | 0.6715 | 0.4035 | 0.6106 | 0.6106 | 0.4932 | 0.2798 |
66
- | 1.3037 | 1.06 | 2000 | 1.1972 | 0.6731 | 0.4053 | 0.6118 | 0.6118 | 0.4916 | 0.3771 |
67
- | 1.3037 | 1.2 | 2250 | 1.1909 | 0.675 | 0.4068 | 0.6137 | 0.6136 | 0.4905 | 0.3314 |
68
- | 1.2676 | 1.33 | 2500 | 1.1889 | 0.6761 | 0.4087 | 0.6144 | 0.6144 | 0.4893 | 0.3314 |
69
- | 1.2676 | 1.46 | 2750 | 1.1848 | 0.6763 | 0.4091 | 0.6151 | 0.6151 | 0.4884 | 0.3314 |
70
- | 1.2796 | 1.6 | 3000 | 1.1829 | 0.6771 | 0.4095 | 0.6155 | 0.6155 | 0.488 | 0.3123 |
71
- | 1.2796 | 1.73 | 3250 | 1.1808 | 0.6769 | 0.4101 | 0.6159 | 0.6159 | 0.4876 | 0.3779 |
72
- | 1.2489 | 1.86 | 3500 | 1.1787 | 0.6772 | 0.4105 | 0.6162 | 0.6162 | 0.4869 | 0.3771 |
73
- | 1.2489 | 1.99 | 3750 | 1.1785 | 0.6774 | 0.4106 | 0.6163 | 0.6162 | 0.4869 | 0.3779 |
74
 
75
 
76
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 1.1670
22
+ - Rouge1: 0.6791
23
+ - Rouge2: 0.4136
24
+ - Rougel: 0.6183
25
+ - Rougelsum: 0.6185
26
+ - Wer: 0.4846
27
+ - Bleurt: 0.3314
28
 
29
  ## Model description
30
 
 
56
 
57
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer | Bleurt |
58
  |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
59
+ | No log | 0.14 | 250 | 1.3197 | 0.6548 | 0.3804 | 0.5904 | 0.5905 | 0.5188 | 0.3009 |
60
+ | 1.7026 | 0.27 | 500 | 1.2676 | 0.6613 | 0.3904 | 0.5985 | 0.5987 | 0.5074 | 0.3009 |
61
+ | 1.7026 | 0.41 | 750 | 1.2385 | 0.6664 | 0.3961 | 0.6043 | 0.6044 | 0.5023 | 0.3009 |
62
+ | 1.3446 | 0.55 | 1000 | 1.2234 | 0.6691 | 0.4009 | 0.6075 | 0.6076 | 0.4972 | 0.3009 |
63
+ | 1.3446 | 0.68 | 1250 | 1.2089 | 0.671 | 0.4031 | 0.6099 | 0.6101 | 0.4944 | 0.3009 |
64
+ | 1.309 | 0.82 | 1500 | 1.1983 | 0.673 | 0.4064 | 0.6121 | 0.6123 | 0.4914 | 0.3009 |
65
+ | 1.309 | 0.96 | 1750 | 1.1900 | 0.6744 | 0.4075 | 0.6136 | 0.6137 | 0.4897 | 0.3009 |
66
+ | 1.2783 | 1.09 | 2000 | 1.1840 | 0.6744 | 0.4082 | 0.614 | 0.6141 | 0.4889 | 0.2798 |
67
+ | 1.2783 | 1.23 | 2250 | 1.1808 | 0.6759 | 0.4102 | 0.6154 | 0.6156 | 0.4875 | 0.2944 |
68
+ | 1.2683 | 1.36 | 2500 | 1.1763 | 0.6771 | 0.4111 | 0.6163 | 0.6165 | 0.4863 | 0.3153 |
69
+ | 1.2683 | 1.5 | 2750 | 1.1720 | 0.6772 | 0.4115 | 0.6169 | 0.617 | 0.4859 | 0.4109 |
70
+ | 1.2469 | 1.64 | 3000 | 1.1701 | 0.6783 | 0.4127 | 0.6176 | 0.6178 | 0.485 | 0.3314 |
71
+ | 1.2469 | 1.77 | 3250 | 1.1680 | 0.6786 | 0.4131 | 0.6178 | 0.6179 | 0.4849 | 0.3314 |
72
+ | 1.2171 | 1.91 | 3500 | 1.1670 | 0.6791 | 0.4136 | 0.6183 | 0.6185 | 0.4846 | 0.3314 |
 
73
 
74
 
75
  ### Framework versions
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "test_BLEURT": -0.9706,
3
- "test_WER": 0.4816,
4
- "test_loss": 1.195426344871521,
5
- "test_rouge1": 0.6823,
6
- "test_rouge2": 0.4189,
7
- "test_rougeL": 0.6225,
8
- "test_rougeLsum": 0.6219,
9
- "test_runtime": 31.876,
10
- "test_samples_per_second": 11.827,
11
- "test_steps_per_second": 1.976
12
  }
 
1
  {
2
+ "test_BLEURT": -0.2487,
3
+ "test_WER": 0.4777,
4
+ "test_loss": 1.1913501024246216,
5
+ "test_rouge1": 0.6851,
6
+ "test_rouge2": 0.4239,
7
+ "test_rougeL": 0.6255,
8
+ "test_rougeLsum": 0.6251,
9
+ "test_runtime": 47.9856,
10
+ "test_samples_per_second": 7.648,
11
+ "test_steps_per_second": 1.292
12
  }
runs/Mar31_00-46-22_93badbe1494c/events.out.tfevents.1711845988.93badbe1494c.1089.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92de8cf168085f39077b66f045dcb36160c73f8d95f7b4db8cfd08797a1fa9fe
3
- size 13689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b30a6d758090b185f3db856fb28d44937b8f67936c95a5cf1440a886cddac253
3
+ size 15396
test_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "test_BLEURT": -0.9706,
3
- "test_WER": 0.4816,
4
- "test_loss": 1.195426344871521,
5
- "test_rouge1": 0.6823,
6
- "test_rouge2": 0.4189,
7
- "test_rougeL": 0.6225,
8
- "test_rougeLsum": 0.6219,
9
- "test_runtime": 31.876,
10
- "test_samples_per_second": 11.827,
11
- "test_steps_per_second": 1.976
12
  }
 
1
  {
2
+ "test_BLEURT": -0.2487,
3
+ "test_WER": 0.4777,
4
+ "test_loss": 1.1913501024246216,
5
+ "test_rouge1": 0.6851,
6
+ "test_rouge2": 0.4239,
7
+ "test_rougeL": 0.6255,
8
+ "test_rougeLsum": 0.6251,
9
+ "test_runtime": 47.9856,
10
+ "test_samples_per_second": 7.648,
11
+ "test_steps_per_second": 1.292
12
  }