End of training
Browse files
README.md
CHANGED
@@ -17,12 +17,12 @@ model-index:
|
|
17 |
name: samsum
|
18 |
type: samsum
|
19 |
config: samsum
|
20 |
-
split:
|
21 |
args: samsum
|
22 |
metrics:
|
23 |
- name: Rouge1
|
24 |
type: rouge
|
25 |
-
value: 48.
|
26 |
---
|
27 |
|
28 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
@@ -32,12 +32,12 @@ should probably proofread and complete it, then remove this comment. -->
|
|
32 |
|
33 |
This model is a fine-tuned version of [google/flan-t5-base](https://huggingface.co/google/flan-t5-base) on the samsum dataset.
|
34 |
It achieves the following results on the evaluation set:
|
35 |
-
- Loss: 1.
|
36 |
-
- Rouge1: 48.
|
37 |
-
- Rouge2: 24.
|
38 |
-
- Rougel:
|
39 |
-
- Rougelsum:
|
40 |
-
- Gen Len:
|
41 |
|
42 |
## Model description
|
43 |
|
@@ -68,9 +68,9 @@ The following hyperparameters were used during training:
|
|
68 |
|
69 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
|
70 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|:-------:|
|
71 |
-
| 1.
|
72 |
-
| 1.
|
73 |
-
| 1.
|
74 |
|
75 |
|
76 |
### Framework versions
|
|
|
17 |
name: samsum
|
18 |
type: samsum
|
19 |
config: samsum
|
20 |
+
split: validation
|
21 |
args: samsum
|
22 |
metrics:
|
23 |
- name: Rouge1
|
24 |
type: rouge
|
25 |
+
value: 48.5717
|
26 |
---
|
27 |
|
28 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
32 |
|
33 |
This model is a fine-tuned version of [google/flan-t5-base](https://huggingface.co/google/flan-t5-base) on the samsum dataset.
|
34 |
It achieves the following results on the evaluation set:
|
35 |
+
- Loss: 1.3743
|
36 |
+
- Rouge1: 48.5717
|
37 |
+
- Rouge2: 24.9633
|
38 |
+
- Rougel: 39.1532
|
39 |
+
- Rougelsum: 45.0174
|
40 |
+
- Gen Len: 36.8362
|
41 |
|
42 |
## Model description
|
43 |
|
|
|
68 |
|
69 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
|
70 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|:-------:|
|
71 |
+
| 1.452 | 1.0 | 1842 | 1.3851 | 48.5682 | 25.1167 | 39.2504 | 45.1912 | 36.8753 |
|
72 |
+
| 1.3402 | 2.0 | 3684 | 1.3743 | 48.5717 | 24.9633 | 39.1532 | 45.0174 | 36.8362 |
|
73 |
+
| 1.2928 | 3.0 | 5526 | 1.3748 | 48.7401 | 25.0144 | 39.1959 | 45.1242 | 36.9438 |
|
74 |
|
75 |
|
76 |
### Framework versions
|
generation_config.json
CHANGED
@@ -1,18 +1,12 @@
|
|
1 |
{
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
no_repeat_ngram_size = 3,
|
13 |
-
eos_token_id = model.generation_config.eos_token_id,
|
14 |
-
pad_token_id = model.generation_config.pad_token_id,
|
15 |
-
forced_bos_token_id = 0,
|
16 |
-
forced_eos_token_id = 2,
|
17 |
-
top_k=0
|
18 |
}
|
|
|
1 |
{
|
2 |
+
"decoder_start_token_id": 0,
|
3 |
+
"early_stopping": true,
|
4 |
+
"eos_token_id": 1,
|
5 |
+
"length_penalty": 2.0,
|
6 |
+
"max_length": 200,
|
7 |
+
"min_length": 30,
|
8 |
+
"no_repeat_ngram_size": 3,
|
9 |
+
"num_beams": 4,
|
10 |
+
"pad_token_id": 0,
|
11 |
+
"transformers_version": "4.42.3"
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
}
|
logs/events.out.tfevents.1720196349.234005ae3c44.359.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3479a6a4adc1f5bd1e18c1ad0c9aec24007a730e109052ab3c36e70f2c495dfa
|
3 |
+
size 10286
|
logs/events.out.tfevents.1720204799.234005ae3c44.359.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88e81d8a092ea862e1696b879c9bdbf7a54767c67b3611ec5f08d42399ed3e41
|
3 |
+
size 613
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 990345064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0717b46811c95a40d76c6e45a697546c1f04d16a430de4a45c7d6acb7d076ee8
|
3 |
size 990345064
|