DiwasDiwas committed on
Commit
68e58da
1 Parent(s): 4a60e64

DiwasDiwas/t5-small-MedicoSummarizer

README.md CHANGED
@@ -15,19 +15,18 @@ should probably proofread and complete it, then remove this comment. -->

 # t5-small-MedicoSummarizer

- This model is a fine-tuned version of [t5-small](https://huggingface.co/t5-small) on 30,000 PubMed articles.
 It achieves the following results on the evaluation set:
- - Loss: 2.9048
- - Rouge1: 0.3226
- - Rouge2: 0.0771
- - Rougel: 0.1964
- - Rougelsum: 0.1967
- - Gen Len: 123.675

 ## Model description

- The Inference API widget doesn't do this model justice, since it doesn't handle trainer checkpoints well.
- So load the model with a `pipeline` and try it that way instead.
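
A minimal sketch of that pipeline-based usage, assuming the repo id shown in this commit and a placeholder input text (an illustration, not the author's exact snippet):

```python
from transformers import pipeline

# Load the fine-tuned checkpoint as a summarization pipeline;
# the repo id comes from this commit, the article text is a placeholder.
summarizer = pipeline("summarization", model="DiwasDiwas/t5-small-MedicoSummarizer")

article = "Placeholder PubMed-style abstract or article body goes here."
result = summarizer(article, max_length=128, min_length=30, do_sample=False)
print(result[0]["summary_text"])
```
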

 ## Intended uses & limitations

@@ -48,23 +47,28 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
- - num_epochs: 5
 - mixed_precision_training: Native AMP

 ### Training results

- | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
- |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:-------:|
- | 3.231 | 1.0 | 1875 | 2.9942 | 0.3149 | 0.0721 | 0.1871 | 0.1873 | 119.685 |
- | 3.153 | 2.0 | 3750 | 2.9426 | 0.3204 | 0.0758 | 0.1935 | 0.1936 | 122.484 |
- | 3.1201 | 3.0 | 5625 | 2.9209 | 0.3215 | 0.0753 | 0.195 | 0.1951 | 123.496 |
- | 3.1008 | 4.0 | 7500 | 2.9072 | 0.3232 | 0.0771 | 0.1969 | 0.1971 | 123.414 |
- | 3.0925 | 5.0 | 9375 | 2.9048 | 0.3226 | 0.0771 | 0.1964 | 0.1967 | 123.675 |


 ### Framework versions

 - Transformers 4.35.2
- - Pytorch 2.1.0+cu118
 - Datasets 2.15.0
 - Tokenizers 0.15.0
 

 # t5-small-MedicoSummarizer

+ This model is a fine-tuned version of [t5-small](https://huggingface.co/t5-small) on the None dataset.
 It achieves the following results on the evaluation set:
+ - Loss: 2.8533
+ - Rouge1: 0.3234
+ - Rouge2: 0.0787
+ - Rougel: 0.1967
+ - Rougelsum: 0.1965
+ - Gen Len: 123.98

 ## Model description

+ More information needed

 ## Intended uses & limitations
 
 
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+ - num_epochs: 10
 - mixed_precision_training: Native AMP

 ### Training results

+ | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
+ |:-------------:|:-----:|:-----:|:---------------:|:------:|:------:|:------:|:---------:|:-------:|
+ | 3.2353 | 1.0 | 1563 | 2.9967 | 0.3034 | 0.0717 | 0.1837 | 0.1836 | 117.308 |
+ | 3.1623 | 2.0 | 3126 | 2.9421 | 0.3178 | 0.0763 | 0.1941 | 0.1941 | 121.529 |
+ | 3.1149 | 3.0 | 4689 | 2.9152 | 0.3223 | 0.078 | 0.1964 | 0.1964 | 123.223 |
+ | 3.1038 | 4.0 | 6252 | 2.8929 | 0.3245 | 0.0793 | 0.1979 | 0.1978 | 123.491 |
+ | 3.0728 | 5.0 | 7815 | 2.8802 | 0.3227 | 0.0777 | 0.1973 | 0.1972 | 123.6 |
+ | 3.0592 | 6.0 | 9378 | 2.8714 | 0.3213 | 0.0788 | 0.1966 | 0.1965 | 123.604 |
+ | 3.0448 | 7.0 | 10941 | 2.8635 | 0.3211 | 0.0776 | 0.1959 | 0.1957 | 123.632 |
+ | 3.0416 | 8.0 | 12504 | 2.8561 | 0.3204 | 0.0777 | 0.1957 | 0.1955 | 123.851 |
+ | 3.0324 | 9.0 | 14067 | 2.8548 | 0.3237 | 0.0788 | 0.1965 | 0.1963 | 123.934 |
+ | 3.0375 | 10.0 | 15630 | 2.8533 | 0.3234 | 0.0787 | 0.1967 | 0.1965 | 123.98 |

 ### Framework versions

 - Transformers 4.35.2
+ - Pytorch 2.1.0+cu121
 - Datasets 2.15.0
 - Tokenizers 0.15.0
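
The hyperparameters above map onto a standard `Seq2SeqTrainingArguments` setup. The sketch below mirrors only the values visible in this hunk (seed, Adam betas/epsilon, linear scheduler, 10 epochs, native AMP); the output directory, learning rate, and batch size are placeholders because they are not shown here:

```python
from transformers import Seq2SeqTrainingArguments

# Mirrors only the values visible in the card above; learning rate and
# batch size are placeholders, not the values actually used for this run.
training_args = Seq2SeqTrainingArguments(
    output_dir="t5-small-MedicoSummarizer",  # placeholder output path
    seed=42,
    adam_beta1=0.9,
    adam_beta2=0.999,
    adam_epsilon=1e-8,
    lr_scheduler_type="linear",
    num_train_epochs=10,
    fp16=True,                       # "Native AMP" mixed precision
    learning_rate=2e-5,              # placeholder
    per_device_train_batch_size=16,  # placeholder
    predict_with_generate=True,      # generate summaries for ROUGE at eval time
)
```

These arguments would then be passed to a `Seq2SeqTrainer` together with the tokenized dataset splits and a `DataCollatorForSeq2Seq`.
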
all_results.json CHANGED
@@ -1,12 +1,12 @@
 {
- "epoch": 5.0,
- "eval_gen_len": 123.675,
- "eval_loss": 2.904787540435791,
- "eval_rouge1": 0.3226,
- "eval_rouge2": 0.0771,
- "eval_rougeL": 0.1964,
- "eval_rougeLsum": 0.1967,
- "eval_runtime": 164.4164,
- "eval_samples_per_second": 6.082,
- "eval_steps_per_second": 0.383
 }

 {
+ "epoch": 10.0,
+ "eval_gen_len": 123.98,
+ "eval_loss": 2.8532516956329346,
+ "eval_rouge1": 0.3234,
+ "eval_rouge2": 0.0787,
+ "eval_rougeL": 0.1967,
+ "eval_rougeLsum": 0.1965,
+ "eval_runtime": 167.6714,
+ "eval_samples_per_second": 5.964,
+ "eval_steps_per_second": 0.376
 }
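
The `eval_rouge*` fields in this file are ROUGE scores on the evaluation split. A minimal sketch of how such numbers are typically computed with the `evaluate` library (placeholder strings, not the actual evaluation code from this run):

```python
import evaluate

# ROUGE metric as reported in all_results.json (rouge1/rouge2/rougeL/rougeLsum).
rouge = evaluate.load("rouge")

predictions = ["model-generated summary text"]      # placeholder outputs
references = ["reference abstract used as target"]  # placeholder targets

scores = rouge.compute(predictions=predictions, references=references)
print(scores)  # {'rouge1': ..., 'rouge2': ..., 'rougeL': ..., 'rougeLsum': ...}
```
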
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
- oid sha256:959f21d96c94eb5fa45ea62693f65afd82444e2456585a779905bdc34e7a6192
 size 242041896

 version https://git-lfs.github.com/spec/v1
+ oid sha256:798869b617260d70b9385c41c02644adddd6f1b024c402b9352b4e9b55500e1c
 size 242041896
runs/Dec20_03-30-55_ef67406028e0/events.out.tfevents.1703043056.ef67406028e0.513.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:230b1cbd625d1c93a25550baab5d4ebf11b3e0699c1fa16ca3d34a9ca13c61e6
+ size 15690
runs/Dec20_03-30-55_ef67406028e0/events.out.tfevents.1703058313.ef67406028e0.513.1 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f5cc31494c2312d2dd1d5058c04a7db0006be27d1e1ddd2d5d6c85df27057745
+ size 613
special_tokens_map.json CHANGED
@@ -101,25 +101,7 @@
 "<extra_id_98>",
 "<extra_id_99>"
 ],
- "eos_token": {
- "content": "</s>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": {
- "content": "<pad>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "unk_token": {
- "content": "<unk>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- }
 }

 "<extra_id_98>",
 "<extra_id_99>"
 ],
+ "eos_token": "</s>",
+ "pad_token": "<pad>",
+ "unk_token": "<unk>"
 }
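
The edit above only changes how the eos/pad/unk entries are serialized (full token dicts collapsed to plain strings). A quick sketch for checking that the loaded tokenizer still exposes the same special tokens, assuming the repo id from this commit:

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("DiwasDiwas/t5-small-MedicoSummarizer")

# The new string form and the earlier dict form resolve to the same tokens.
print(tokenizer.eos_token, tokenizer.pad_token, tokenizer.unk_token)  # </s> <pad> <unk>
print(tokenizer.special_tokens_map["eos_token"])                      # </s>
```
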
tokenizer_config.json CHANGED
@@ -931,12 +931,8 @@
 "clean_up_tokenization_spaces": true,
 "eos_token": "</s>",
 "extra_ids": 100,
- "max_length": 128,
 "model_max_length": 512,
 "pad_token": "<pad>",
- "stride": 0,
 "tokenizer_class": "T5Tokenizer",
- "truncation_side": "right",
- "truncation_strategy": "longest_first",
 "unk_token": "<unk>"
 }

 "clean_up_tokenization_spaces": true,
 "eos_token": "</s>",
 "extra_ids": 100,
 "model_max_length": 512,
 "pad_token": "<pad>",
 "tokenizer_class": "T5Tokenizer",
 "unk_token": "<unk>"
 }
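
With `max_length`, `stride`, and the truncation keys dropped from `tokenizer_config.json`, truncation is whatever the caller requests, bounded by the remaining `model_max_length` of 512. A hedged sketch of passing those settings explicitly at encode time, using a placeholder input:

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("DiwasDiwas/t5-small-MedicoSummarizer")

text = "Placeholder article text to be summarized."  # illustrative input only

# Request truncation explicitly rather than relying on values stored in the
# saved tokenizer config; model_max_length for this tokenizer is 512.
encoded = tokenizer(text, truncation=True, max_length=512, return_tensors="pt")
print(encoded["input_ids"].shape)
```
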
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
- oid sha256:459e0ba38d7350474ee4d0d03e220420a9554159f87d4056a357225a48ee2a7a
 size 4856

 version https://git-lfs.github.com/spec/v1
+ oid sha256:a6b9527ce9981eb9cdd15fed72f7b10e586f1e033ee34d9f0a1a68c59d14aa0d
 size 4856