End of training
Browse files
- README.md +11 -11
- model.safetensors +1 -1
- runs/Feb28_13-41-13_3897ec21fae5/events.out.tfevents.1709127675.3897ec21fae5.21575.0 +3 -0
- tokenizer.json +81 -19
- training_args.bin +1 -1
README.md
CHANGED
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
13 |
|
14 |
This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
-
- Loss: 0.
|
17 |
|
18 |
## Model description
|
19 |
|
@@ -44,16 +44,16 @@ The following hyperparameters were used during training:
|
|
44 |
|
45 |
| Training Loss | Epoch | Step | Validation Loss |
|
46 |
|:-------------:|:-----:|:----:|:---------------:|
|
47 |
-
| 2.
|
48 |
-
|
|
49 |
-
| 1.
|
50 |
-
| 1.
|
51 |
-
| 1.
|
52 |
-
|
|
53 |
-
| 0.
|
54 |
-
| 0.
|
55 |
-
| 0.
|
56 |
-
| 0.
|
57 |
|
58 |
|
59 |
### Framework versions
|
|
|
13 |
|
14 |
This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
+
- Loss: 0.7400
|
17 |
|
18 |
## Model description
|
19 |
|
|
|
44 |
|
45 |
| Training Loss | Epoch | Step | Validation Loss |
|
46 |
|:-------------:|:-----:|:----:|:---------------:|
|
47 |
+
| 2.966 | 1.0 | 6 | 2.2765 |
|
48 |
+
| 2.0606 | 2.0 | 12 | 1.7855 |
|
49 |
+
| 1.6303 | 3.0 | 18 | 1.4249 |
|
50 |
+
| 1.2968 | 4.0 | 24 | 1.1742 |
|
51 |
+
| 1.1342 | 5.0 | 30 | 1.0421 |
|
52 |
+
| 0.9916 | 6.0 | 36 | 0.9159 |
|
53 |
+
| 0.8864 | 7.0 | 42 | 0.8410 |
|
54 |
+
| 0.8119 | 8.0 | 48 | 0.7857 |
|
55 |
+
| 0.7691 | 9.0 | 54 | 0.7509 |
|
56 |
+
| 0.7515 | 10.0 | 60 | 0.7400 |
|
57 |
|
58 |
|
59 |
### Framework versions
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 31213760
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52242b7293996d19398d1cb5904e713f5bce9bdcddfa61064c3e552d21d77ae3
|
3 |
size 31213760
|
runs/Feb28_13-41-13_3897ec21fae5/events.out.tfevents.1709127675.3897ec21fae5.21575.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0421b0459a1f756991e9096e9a3c2ce821a636db440b83873ad27b613c136813
|
3 |
+
size 12864
|
tokenizer.json
CHANGED
@@ -71,7 +71,69 @@
|
|
71 |
"pre_tokenizer": {
|
72 |
"type": "Whitespace"
|
73 |
},
|
74 |
-
"post_processor": null,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
75 |
"decoder": null,
|
76 |
"model": {
|
77 |
"type": "BPE",
|
@@ -106,18 +168,18 @@
|
|
106 |
"10": 21,
|
107 |
"98": 22,
|
108 |
"11": 23,
|
109 |
-
"12": 24,
|
110 |
-
"97": 25,
|
111 |
-
"13": 26,
|
112 |
-
"96": 27,
|
113 |
"95": 28,
|
114 |
"14": 29,
|
115 |
"94": 30,
|
116 |
"15": 31,
|
117 |
-
"16": 32,
|
118 |
-
"93": 33,
|
119 |
-
"17": 34,
|
120 |
-
"92": 35,
|
121 |
"91": 36,
|
122 |
"18": 37,
|
123 |
"19": 38,
|
@@ -130,10 +192,10 @@
|
|
130 |
"87": 45,
|
131 |
"23": 46,
|
132 |
"86": 47,
|
133 |
-
"24": 48,
|
134 |
-
"85": 49,
|
135 |
-
"84": 50,
|
136 |
-
"25": 51,
|
137 |
"26": 52,
|
138 |
"83": 53,
|
139 |
"27": 54,
|
@@ -144,18 +206,18 @@
|
|
144 |
"1 0",
|
145 |
"9 8",
|
146 |
"1 1",
|
147 |
-
"1 2",
|
148 |
"9 7",
|
149 |
-
"1 3",
|
150 |
"9 6",
|
|
|
151 |
"9 5",
|
152 |
"1 4",
|
153 |
"9 4",
|
154 |
"1 5",
|
155 |
-
"1 6",
|
156 |
"9 3",
|
157 |
-
"1 7",
|
158 |
"9 2",
|
|
|
159 |
"9 1",
|
160 |
"1 8",
|
161 |
"1 9",
|
@@ -168,10 +230,10 @@
|
|
168 |
"8 7",
|
169 |
"2 3",
|
170 |
"8 6",
|
171 |
-
"2 4",
|
172 |
"8 5",
|
173 |
-
"8 4",
|
174 |
"2 5",
|
|
|
175 |
"2 6",
|
176 |
"8 3",
|
177 |
"2 7",
|
|
|
71 |
"pre_tokenizer": {
|
72 |
"type": "Whitespace"
|
73 |
},
|
74 |
+
"post_processor": {
|
75 |
+
"type": "TemplateProcessing",
|
76 |
+
"single": [
|
77 |
+
{
|
78 |
+
"Sequence": {
|
79 |
+
"id": "A",
|
80 |
+
"type_id": 0
|
81 |
+
}
|
82 |
+
},
|
83 |
+
{
|
84 |
+
"SpecialToken": {
|
85 |
+
"id": "[CLS]",
|
86 |
+
"type_id": 0
|
87 |
+
}
|
88 |
+
}
|
89 |
+
],
|
90 |
+
"pair": [
|
91 |
+
{
|
92 |
+
"Sequence": {
|
93 |
+
"id": "A",
|
94 |
+
"type_id": 0
|
95 |
+
}
|
96 |
+
},
|
97 |
+
{
|
98 |
+
"SpecialToken": {
|
99 |
+
"id": "[CLS]",
|
100 |
+
"type_id": 0
|
101 |
+
}
|
102 |
+
},
|
103 |
+
{
|
104 |
+
"Sequence": {
|
105 |
+
"id": "B",
|
106 |
+
"type_id": 1
|
107 |
+
}
|
108 |
+
},
|
109 |
+
{
|
110 |
+
"SpecialToken": {
|
111 |
+
"id": "[EOS]",
|
112 |
+
"type_id": 1
|
113 |
+
}
|
114 |
+
}
|
115 |
+
],
|
116 |
+
"special_tokens": {
|
117 |
+
"[CLS]": {
|
118 |
+
"id": "[CLS]",
|
119 |
+
"ids": [
|
120 |
+
0
|
121 |
+
],
|
122 |
+
"tokens": [
|
123 |
+
"[CLS]"
|
124 |
+
]
|
125 |
+
},
|
126 |
+
"[EOS]": {
|
127 |
+
"id": "[EOS]",
|
128 |
+
"ids": [
|
129 |
+
1
|
130 |
+
],
|
131 |
+
"tokens": [
|
132 |
+
"[EOS]"
|
133 |
+
]
|
134 |
+
}
|
135 |
+
}
|
136 |
+
},
|
137 |
"decoder": null,
|
138 |
"model": {
|
139 |
"type": "BPE",
|
|
|
168 |
"10": 21,
|
169 |
"98": 22,
|
170 |
"11": 23,
|
171 |
+
"97": 24,
|
172 |
+
"12": 25,
|
173 |
+
"96": 26,
|
174 |
+
"13": 27,
|
175 |
"95": 28,
|
176 |
"14": 29,
|
177 |
"94": 30,
|
178 |
"15": 31,
|
179 |
+
"93": 32,
|
180 |
+
"16": 33,
|
181 |
+
"92": 34,
|
182 |
+
"17": 35,
|
183 |
"91": 36,
|
184 |
"18": 37,
|
185 |
"19": 38,
|
|
|
192 |
"87": 45,
|
193 |
"23": 46,
|
194 |
"86": 47,
|
195 |
+
"85": 48,
|
196 |
+
"24": 49,
|
197 |
+
"25": 50,
|
198 |
+
"84": 51,
|
199 |
"26": 52,
|
200 |
"83": 53,
|
201 |
"27": 54,
|
|
|
206 |
"1 0",
|
207 |
"9 8",
|
208 |
"1 1",
|
|
|
209 |
"9 7",
|
210 |
+
"1 2",
|
211 |
"9 6",
|
212 |
+
"1 3",
|
213 |
"9 5",
|
214 |
"1 4",
|
215 |
"9 4",
|
216 |
"1 5",
|
|
|
217 |
"9 3",
|
218 |
+
"1 6",
|
219 |
"9 2",
|
220 |
+
"1 7",
|
221 |
"9 1",
|
222 |
"1 8",
|
223 |
"1 9",
|
|
|
230 |
"8 7",
|
231 |
"2 3",
|
232 |
"8 6",
|
|
|
233 |
"8 5",
|
234 |
+
"2 4",
|
235 |
"2 5",
|
236 |
+
"8 4",
|
237 |
"2 6",
|
238 |
"8 3",
|
239 |
"2 7",
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e54a33d2f290f85e42924b5f98306a6bedf48ced4afa93e90600479ea6cfd23f
|
3 |
size 4920
|