End of training
Browse files
- README.md +40 -9
- config.json +1 -1
- generation_config.json +1 -1
- model.safetensors +1 -1
- runs/Sep23_04-48-23_1838c69cedab/events.out.tfevents.1727066904.1838c69cedab.1885.0 +3 -0
- tokenizer.json +1 -6
- training_args.bin +2 -2
README.md
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
---
|
|
|
2 |
license: mit
|
3 |
base_model: gpt2
|
4 |
tags:
|
@@ -15,12 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
15 |
|
16 |
This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
|
17 |
It achieves the following results on the evaluation set:
|
18 |
-
-
|
19 |
-
- eval_runtime: 13.3388
|
20 |
-
- eval_samples_per_second: 1030.149
|
21 |
-
- eval_steps_per_second: 32.237
|
22 |
-
- epoch: 1.6071
|
23 |
-
- step: 90
|
24 |
|
25 |
## Model description
|
26 |
|
@@ -51,9 +47,44 @@ The following hyperparameters were used during training:
|
|
51 |
- num_epochs: 5
|
52 |
- mixed_precision_training: Native AMP
|
53 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
54 |
### Framework versions
|
55 |
|
56 |
-
- Transformers 4.
|
57 |
-
- Pytorch 2.
|
58 |
-
- Datasets
|
59 |
- Tokenizers 0.19.1
|
|
|
1 |
---
|
2 |
+
library_name: transformers
|
3 |
license: mit
|
4 |
base_model: gpt2
|
5 |
tags:
|
|
|
16 |
|
17 |
This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
|
18 |
It achieves the following results on the evaluation set:
|
19 |
+
- Loss: 5.0287
|
|
|
|
|
|
|
|
|
|
|
20 |
|
21 |
## Model description
|
22 |
|
|
|
47 |
- num_epochs: 5
|
48 |
- mixed_precision_training: Native AMP
|
49 |
|
50 |
+
### Training results
|
51 |
+
|
52 |
+
| Training Loss | Epoch | Step | Validation Loss |
|
53 |
+
|:-------------:|:------:|:----:|:---------------:|
|
54 |
+
| 9.5172 | 0.1699 | 10 | 8.0210 |
|
55 |
+
| 7.1368 | 0.3397 | 20 | 7.3939 |
|
56 |
+
| 6.7858 | 0.5096 | 30 | 6.8556 |
|
57 |
+
| 6.3872 | 0.6794 | 40 | 6.6165 |
|
58 |
+
| 6.0964 | 0.8493 | 50 | 6.3605 |
|
59 |
+
| 5.8534 | 1.0191 | 60 | 6.1202 |
|
60 |
+
| 5.6031 | 1.1890 | 70 | 5.9613 |
|
61 |
+
| 5.4271 | 1.3588 | 80 | 5.8534 |
|
62 |
+
| 5.3319 | 1.5287 | 90 | 5.7526 |
|
63 |
+
| 5.1911 | 1.6985 | 100 | 5.6603 |
|
64 |
+
| 5.1143 | 1.8684 | 110 | 5.5964 |
|
65 |
+
| 5.024 | 2.0382 | 120 | 5.5203 |
|
66 |
+
| 4.8772 | 2.2081 | 130 | 5.4652 |
|
67 |
+
| 4.8455 | 2.3779 | 140 | 5.4071 |
|
68 |
+
| 4.7629 | 2.5478 | 150 | 5.3446 |
|
69 |
+
| 4.6666 | 2.7176 | 160 | 5.2905 |
|
70 |
+
| 4.6672 | 2.8875 | 170 | 5.2415 |
|
71 |
+
| 4.5738 | 3.0573 | 180 | 5.2033 |
|
72 |
+
| 4.4949 | 3.2272 | 190 | 5.1688 |
|
73 |
+
| 4.4406 | 3.3970 | 200 | 5.1329 |
|
74 |
+
| 4.4166 | 3.5669 | 210 | 5.1085 |
|
75 |
+
| 4.3886 | 3.7367 | 220 | 5.0823 |
|
76 |
+
| 4.3302 | 3.9066 | 230 | 5.0652 |
|
77 |
+
| 4.3089 | 4.0764 | 240 | 5.0498 |
|
78 |
+
| 4.2768 | 4.2463 | 250 | 5.0409 |
|
79 |
+
| 4.2667 | 4.4161 | 260 | 5.0344 |
|
80 |
+
| 4.2604 | 4.5860 | 270 | 5.0300 |
|
81 |
+
| 4.2389 | 4.7558 | 280 | 5.0290 |
|
82 |
+
| 4.2726 | 4.9257 | 290 | 5.0287 |
|
83 |
+
|
84 |
+
|
85 |
### Framework versions
|
86 |
|
87 |
+
- Transformers 4.44.2
|
88 |
+
- Pytorch 2.4.1+cu121
|
89 |
+
- Datasets 3.0.0
|
90 |
- Tokenizers 0.19.1
|
config.json
CHANGED
@@ -33,7 +33,7 @@
|
|
33 |
}
|
34 |
},
|
35 |
"torch_dtype": "float32",
|
36 |
-
"transformers_version": "4.
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 50000
|
39 |
}
|
|
|
33 |
}
|
34 |
},
|
35 |
"torch_dtype": "float32",
|
36 |
+
"transformers_version": "4.44.2",
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 50000
|
39 |
}
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 0,
|
4 |
"eos_token_id": 0,
|
5 |
-
"transformers_version": "4.
|
6 |
}
|
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 0,
|
4 |
"eos_token_id": 0,
|
5 |
+
"transformers_version": "4.44.2"
|
6 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 496984704
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f430019026db6ff200038e7a0108878658540ca89445c55c151c654e439fee9d
|
3 |
size 496984704
|
runs/Sep23_04-48-23_1838c69cedab/events.out.tfevents.1727066904.1838c69cedab.1885.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33fe3a7a122dc6eb813f08ffba3629bd217c14cd8fefa728e45ff456a97a102d
|
3 |
+
size 19345
|
tokenizer.json
CHANGED
@@ -1,11 +1,6 @@
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
-
"truncation": {
|
4 |
-
"direction": "Right",
|
5 |
-
"max_length": 128,
|
6 |
-
"strategy": "LongestFirst",
|
7 |
-
"stride": 0
|
8 |
-
},
|
9 |
"padding": null,
|
10 |
"added_tokens": [
|
11 |
{
|
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
+
"truncation": null,
|
|
|
|
|
|
|
|
|
|
|
4 |
"padding": null,
|
5 |
"added_tokens": [
|
6 |
{
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:150690969cd7b3c9177d8824a179025f0f5cd07d5f9c03eb90877394a6e79743
|
3 |
+
size 5176
|