Trabalho/imageCaptioning
Browse files
- README.md +25 -13
- config.json +1 -1
- generation_config.json +1 -1
- pytorch_model.bin +2 -2
- training_args.bin +2 -2
README.md
CHANGED
@@ -18,13 +18,13 @@ should probably proofread and complete it, then remove this comment. -->
|
|
18 |
|
19 |
This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on the COCO dataset.
|
20 |
It achieves the following results on the evaluation set:
|
21 |
-
- Loss:
|
22 |
-
- Rouge1:
|
23 |
-
- Rouge2:
|
24 |
-
- Rougel:
|
25 |
-
- Rougelsum:
|
26 |
-
- Bleu:
|
27 |
-
- Gen Len: 11.
|
28 |
|
29 |
## Model description
|
30 |
|
@@ -44,20 +44,32 @@ More information needed
|
|
44 |
|
45 |
The following hyperparameters were used during training:
|
46 |
- learning_rate: 5e-05
|
47 |
-
- train_batch_size:
|
48 |
-
- eval_batch_size:
|
49 |
- seed: 42
|
50 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
51 |
- lr_scheduler_type: linear
|
52 |
-
- num_epochs:
|
53 |
|
54 |
### Training results
|
55 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
56 |
|
57 |
|
58 |
### Framework versions
|
59 |
|
60 |
-
- Transformers 4.34.
|
61 |
-
- Pytorch 2.0
|
62 |
-
- Datasets 2.14.
|
63 |
- Tokenizers 0.14.1
|
|
|
18 |
|
19 |
This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on the COCO dataset.
|
20 |
It achieves the following results on the evaluation set:
|
21 |
+
- Loss: 0.8174
|
22 |
+
- Rouge1: 41.4513
|
23 |
+
- Rouge2: 15.9705
|
24 |
+
- Rougel: 37.8534
|
25 |
+
- Rougelsum: 37.8514
|
26 |
+
- Bleu: 9.9633
|
27 |
+
- Gen Len: 11.3253
|
28 |
|
29 |
## Model description
|
30 |
|
|
|
44 |
|
45 |
The following hyperparameters were used during training:
|
46 |
- learning_rate: 5e-05
|
47 |
+
- train_batch_size: 16
|
48 |
+
- eval_batch_size: 16
|
49 |
- seed: 42
|
50 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
51 |
- lr_scheduler_type: linear
|
52 |
+
- num_epochs: 2
|
53 |
|
54 |
### Training results
|
55 |
|
56 |
+
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Bleu | Gen Len |
|
57 |
+
|:-------------:|:-----:|:-----:|:---------------:|:-------:|:-------:|:-------:|:---------:|:------:|:-------:|
|
58 |
+
| 1.091 | 0.19 | 2000 | 0.9783 | 35.5981 | 11.1245 | 32.4533 | 32.4622 | 6.1315 | 11.3253 |
|
59 |
+
| 0.9629 | 0.38 | 4000 | 0.9306 | 36.8386 | 12.0629 | 33.7446 | 33.7445 | 6.806 | 11.3253 |
|
60 |
+
| 0.9251 | 0.57 | 6000 | 0.9004 | 37.8439 | 13.1346 | 34.663 | 34.6608 | 7.6122 | 11.3253 |
|
61 |
+
| 0.9116 | 0.75 | 8000 | 0.8759 | 38.5078 | 13.477 | 35.1981 | 35.2143 | 7.6881 | 11.3253 |
|
62 |
+
| 0.8903 | 0.94 | 10000 | 0.8592 | 39.6087 | 14.2529 | 36.0992 | 36.1042 | 8.5688 | 11.3253 |
|
63 |
+
| 0.8381 | 1.13 | 12000 | 0.8480 | 40.3217 | 15.012 | 36.8038 | 36.8046 | 9.1783 | 11.3253 |
|
64 |
+
| 0.8066 | 1.32 | 14000 | 0.8383 | 40.7187 | 15.1971 | 37.15 | 37.148 | 9.2942 | 11.3253 |
|
65 |
+
| 0.7938 | 1.51 | 16000 | 0.8298 | 41.1227 | 15.635 | 37.423 | 37.4147 | 9.6574 | 11.3253 |
|
66 |
+
| 0.7854 | 1.7 | 18000 | 0.8232 | 41.5275 | 16.007 | 37.8586 | 37.8569 | 9.8936 | 11.3253 |
|
67 |
+
| 0.7837 | 1.88 | 20000 | 0.8190 | 41.2515 | 15.8468 | 37.6257 | 37.6252 | 9.8732 | 11.3253 |
|
68 |
|
69 |
|
70 |
### Framework versions
|
71 |
|
72 |
+
- Transformers 4.34.1
|
73 |
+
- Pytorch 2.1.0+cu118
|
74 |
+
- Datasets 2.14.6
|
75 |
- Tokenizers 0.14.1
|
config.json
CHANGED
@@ -43284,5 +43284,5 @@
|
|
43284 |
"pad_token_id": 50256,
|
43285 |
"tie_word_embeddings": false,
|
43286 |
"torch_dtype": "float32",
|
43287 |
-
"transformers_version": "4.34.
|
43288 |
}
|
|
|
43284 |
"pad_token_id": 50256,
|
43285 |
"tie_word_embeddings": false,
|
43286 |
"torch_dtype": "float32",
|
43287 |
+
"transformers_version": "4.34.1"
|
43288 |
}
|
generation_config.json
CHANGED
@@ -3,5 +3,5 @@
|
|
3 |
"decoder_start_token_id": 50256,
|
4 |
"eos_token_id": 50256,
|
5 |
"pad_token_id": 50256,
|
6 |
-
"transformers_version": "4.34.
|
7 |
}
|
|
|
3 |
"decoder_start_token_id": 50256,
|
4 |
"eos_token_id": 50256,
|
5 |
"pad_token_id": 50256,
|
6 |
+
"transformers_version": "4.34.1"
|
7 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4813c749bf5afeb78278a0ac165efeecacc01bef9b28ab7d9e0e9262101c46e
|
3 |
+
size 962051678
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:182ad1ade3b89eb281ca4c2835c86503659b2aad7d918e84c37e5861d1d14e74
|
3 |
+
size 4664
|