Training in progress epoch 0
Browse files
- README.md +4 -66
- config.json +1 -1
- tf_model.h5 +2 -2
- tokenizer.json +0 -0
README.md
CHANGED
@@ -13,9 +13,9 @@ probably proofread and complete it, then remove this comment. -->
|
|
13 |
|
14 |
This model is a fine-tuned version of [madatnlp/ke-t5-math-py](https://huggingface.co/madatnlp/ke-t5-math-py) on an unknown dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
-
- Train Loss:
|
17 |
-
- Validation Loss:
|
18 |
-
- Epoch:
|
19 |
|
20 |
## Model description
|
21 |
|
@@ -41,69 +41,7 @@ The following hyperparameters were used during training:
|
|
41 |
|
42 |
| Train Loss | Validation Loss | Epoch |
|
43 |
|:----------:|:---------------:|:-----:|
|
44 |
-
| 8.
|
45 |
-
| 4.8177 | 3.6298 | 1 |
|
46 |
-
| 3.7818 | 2.9571 | 2 |
|
47 |
-
| 3.1838 | 2.6057 | 3 |
|
48 |
-
| 2.9168 | 2.2649 | 4 |
|
49 |
-
| 2.6802 | 2.1726 | 5 |
|
50 |
-
| 2.4846 | 1.9500 | 6 |
|
51 |
-
| 2.3544 | 1.8473 | 7 |
|
52 |
-
| 2.2090 | 1.9038 | 8 |
|
53 |
-
| 2.1377 | 1.7177 | 9 |
|
54 |
-
| 2.0199 | 1.7486 | 10 |
|
55 |
-
| 1.9425 | 1.7548 | 11 |
|
56 |
-
| 1.9077 | 1.6535 | 12 |
|
57 |
-
| 1.8587 | 1.6882 | 13 |
|
58 |
-
| 1.7940 | 1.5747 | 14 |
|
59 |
-
| 1.7580 | 1.5802 | 15 |
|
60 |
-
| 1.6726 | 1.6279 | 16 |
|
61 |
-
| 1.6797 | 1.4446 | 17 |
|
62 |
-
| 1.6454 | 1.4076 | 18 |
|
63 |
-
| 1.6210 | 1.4485 | 19 |
|
64 |
-
| 1.5961 | 1.3576 | 20 |
|
65 |
-
| 1.5489 | 1.3601 | 21 |
|
66 |
-
| 1.5157 | 1.3144 | 22 |
|
67 |
-
| 1.4978 | 1.3140 | 23 |
|
68 |
-
| 1.4719 | 1.3428 | 24 |
|
69 |
-
| 1.4585 | 1.2431 | 25 |
|
70 |
-
| 1.4342 | 1.2828 | 26 |
|
71 |
-
| 1.3962 | 1.2625 | 27 |
|
72 |
-
| 1.4092 | 1.1976 | 28 |
|
73 |
-
| 1.3675 | 1.1740 | 29 |
|
74 |
-
| 1.3708 | 1.2612 | 30 |
|
75 |
-
| 1.3305 | 1.1599 | 31 |
|
76 |
-
| 1.3393 | 1.1862 | 32 |
|
77 |
-
| 1.3057 | 1.1180 | 33 |
|
78 |
-
| 1.2774 | 1.1649 | 34 |
|
79 |
-
| 1.3060 | 1.1652 | 35 |
|
80 |
-
| 1.2731 | 1.1321 | 36 |
|
81 |
-
| 1.2395 | 1.0716 | 37 |
|
82 |
-
| 1.2488 | 1.1154 | 38 |
|
83 |
-
| 1.2341 | 1.0532 | 39 |
|
84 |
-
| 1.2168 | 1.1519 | 40 |
|
85 |
-
| 1.2028 | 1.1080 | 41 |
|
86 |
-
| 1.1993 | 1.0462 | 42 |
|
87 |
-
| 1.1741 | 1.0575 | 43 |
|
88 |
-
| 1.1854 | 1.1024 | 44 |
|
89 |
-
| 1.1473 | 1.0656 | 45 |
|
90 |
-
| 1.1568 | 1.0983 | 46 |
|
91 |
-
| 1.1373 | 1.0441 | 47 |
|
92 |
-
| 1.1168 | 1.0559 | 48 |
|
93 |
-
| 1.1256 | 1.0653 | 49 |
|
94 |
-
| 1.1066 | 0.9999 | 50 |
|
95 |
-
| 1.1021 | 0.9710 | 51 |
|
96 |
-
| 1.0877 | 0.9592 | 52 |
|
97 |
-
| 1.0749 | 0.9846 | 53 |
|
98 |
-
| 1.0790 | 0.9816 | 54 |
|
99 |
-
| 1.0671 | 1.0013 | 55 |
|
100 |
-
| 1.0424 | 0.9643 | 56 |
|
101 |
-
| 1.0386 | 1.0248 | 57 |
|
102 |
-
| 1.0360 | 0.9749 | 58 |
|
103 |
-
| 1.0255 | 1.0094 | 59 |
|
104 |
-
| 1.0092 | 0.9702 | 60 |
|
105 |
-
| 1.0186 | 1.0089 | 61 |
|
106 |
-
| 0.9996 | 1.0227 | 62 |
|
107 |
|
108 |
|
109 |
### Framework versions
|
|
|
13 |
|
14 |
This model is a fine-tuned version of [madatnlp/ke-t5-math-py](https://huggingface.co/madatnlp/ke-t5-math-py) on an unknown dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
+
- Train Loss: 8.0101
|
17 |
+
- Validation Loss: 5.1280
|
18 |
+
- Epoch: 0
|
19 |
|
20 |
## Model description
|
21 |
|
|
|
41 |
|
42 |
| Train Loss | Validation Loss | Epoch |
|
43 |
|:----------:|:---------------:|:-----:|
|
44 |
+
| 8.0101 | 5.1280 | 0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
45 |
|
46 |
|
47 |
### Framework versions
|
config.json
CHANGED
@@ -23,5 +23,5 @@
|
|
23 |
"relative_attention_num_buckets": 32,
|
24 |
"transformers_version": "4.18.0",
|
25 |
"use_cache": true,
|
26 |
-
"vocab_size":
|
27 |
}
|
|
|
23 |
"relative_attention_num_buckets": 32,
|
24 |
"transformers_version": "4.18.0",
|
25 |
"use_cache": true,
|
26 |
+
"vocab_size": 6194
|
27 |
}
|
tf_model.h5
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34be35d170f12bf69d1ad64dd6e9cfffbed53ab779d9dcbc12fa06e21a339883
|
3 |
+
size 831546704
|
tokenizer.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|