End of training

Browse files

Files changed (5)

README.md +15 -15
model.safetensors +1 -1
runs/Dec06_09-23-29_7bb9bb6007a1/events.out.tfevents.1701860367.7bb9bb6007a1.626.3 +3 -0
special_tokens_map.json +21 -3
tokenizer_config.json +7 -0

README.md CHANGED Viewed

@@ -17,12 +17,12 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.1056
-- Rouge1: 59.8095
 - Rouge2: 47.0
-- Rougel: 59.8095
-- Rougelsum: 59.8095
-- Gen Len: 14.6
 ## Model description
@@ -53,16 +53,16 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Rouge1  | Rouge2 | Rougel  | Rougelsum | Gen Len |
 |:-------------:|:-----:|:----:|:---------------:|:-------:|:------:|:-------:|:---------:|:-------:|
-| No log        | 1.0   | 5    | 2.8921          | 15.7143 | 0.0    | 15.7143 | 15.0      | 7.2     |
-| No log        | 2.0   | 10   | 2.1172          | 19.0    | 0.0    | 19.1905 | 18.5714   | 8.2     |
-| No log        | 3.0   | 15   | 1.7513          | 33.7143 | 20.0   | 34.0    | 33.3333   | 7.8     |
-| No log        | 4.0   | 20   | 1.4905          | 46.7143 | 34.0   | 47.0476 | 46.7143   | 12.3    |
-| No log        | 5.0   | 25   | 1.3527          | 55.5714 | 39.0   | 55.4762 | 54.5714   | 12.9    |
-| No log        | 6.0   | 30   | 1.3376          | 58.0952 | 39.0   | 58.0952 | 57.4286   | 13.6    |
-| No log        | 7.0   | 35   | 1.2002          | 58.5714 | 39.0   | 58.5714 | 57.8095   | 13.3    |
-| No log        | 8.0   | 40   | 1.1349          | 55.0476 | 39.0   | 54.5714 | 54.5714   | 14.3    |
-| No log        | 9.0   | 45   | 1.1106          | 59.8095 | 47.0   | 59.8095 | 59.8095   | 14.6    |
-| No log        | 10.0  | 50   | 1.1056          | 59.8095 | 47.0   | 59.8095 | 59.8095   | 14.6    |
 ### Framework versions

 This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.7928
+- Rouge1: 62.0833
 - Rouge2: 47.0
+- Rougel: 62.0952
+- Rougelsum: 61.2857
+- Gen Len: 14.2
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | Rouge1  | Rouge2 | Rougel  | Rougelsum | Gen Len |
 |:-------------:|:-----:|:----:|:---------------:|:-------:|:------:|:-------:|:---------:|:-------:|
+| No log        | 1.0   | 5    | 1.0434          | 55.9048 | 39.0   | 55.9048 | 55.7143   | 13.2    |
+| No log        | 2.0   | 10   | 0.9903          | 62.7619 | 47.0   | 62.6667 | 62.7619   | 14.8    |
+| No log        | 3.0   | 15   | 0.9273          | 56.4762 | 47.0   | 56.4762 | 56.1905   | 14.4    |
+| No log        | 4.0   | 20   | 0.9185          | 60.4762 | 47.0   | 60.4762 | 59.8095   | 13.5    |
+| No log        | 5.0   | 25   | 0.8703          | 64.5714 | 47.0   | 64.4762 | 64.4762   | 13.2    |
+| No log        | 6.0   | 30   | 0.8186          | 68.1429 | 50.0   | 68.5714 | 68.0238   | 14.6    |
+| No log        | 7.0   | 35   | 0.7856          | 64.7857 | 50.0   | 64.5714 | 64.0952   | 14.4    |
+| No log        | 8.0   | 40   | 0.7755          | 64.7857 | 50.0   | 64.5714 | 64.0952   | 14.2    |
+| No log        | 9.0   | 45   | 0.7864          | 64.7857 | 50.0   | 64.5714 | 64.0952   | 14.2    |
+| No log        | 10.0  | 50   | 0.7928          | 62.0833 | 47.0   | 62.0952 | 61.2857   | 14.2    |
 ### Framework versions

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a4e757066a16cbdea075ad0690a8bb8b2c067cfbda800feed03940145b544cf
 size 307867048

 version https://git-lfs.github.com/spec/v1
+oid sha256:24f99809e2d8febc661302df9ea87076d2e30e0ee609367643d57d2aec7679da
 size 307867048

runs/Dec06_09-23-29_7bb9bb6007a1/events.out.tfevents.1701860367.7bb9bb6007a1.626.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1ab79c624238634b39001e6a1218811a2ae5790beeebdbad5430c167fd73ca40
+size 10817

special_tokens_map.json CHANGED Viewed

@@ -101,7 +101,25 @@
     "<extra_id_98>",
     "<extra_id_99>"
   ],
-  "eos_token": "</s>",
-  "pad_token": "<pad>",
-  "unk_token": "<unk>"
 }

     "<extra_id_98>",
     "<extra_id_99>"
   ],
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tokenizer_config.json CHANGED Viewed

@@ -930,9 +930,16 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},
   "tokenizer_class": "T5Tokenizer",
   "unk_token": "<unk>"
 }

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
+  "max_length": 48,
   "model_max_length": 512,
+  "pad_to_multiple_of": null,
   "pad_token": "<pad>",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sp_model_kwargs": {},
+  "stride": 0,
   "tokenizer_class": "T5Tokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }