ludziej committed on
Commit
8736aaf
1 Parent(s): 3436e55

End of training

Browse files
README.md CHANGED
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 0.8243
17
 
18
  ## Model description
19
 
@@ -44,16 +44,16 @@ The following hyperparameters were used during training:
44
 
45
  | Training Loss | Epoch | Step | Validation Loss |
46
  |:-------------:|:-----:|:----:|:---------------:|
47
- | 2.8893 | 1.0 | 6 | 2.1271 |
48
- | 1.9669 | 2.0 | 12 | 1.8233 |
49
- | 1.6822 | 3.0 | 18 | 1.5134 |
50
- | 1.3991 | 4.0 | 24 | 1.2639 |
51
- | 1.1731 | 5.0 | 30 | 1.1030 |
52
- | 1.0664 | 6.0 | 36 | 0.9758 |
53
- | 0.9729 | 7.0 | 42 | 0.9245 |
54
- | 0.9171 | 8.0 | 48 | 0.8696 |
55
- | 0.8722 | 9.0 | 54 | 0.8384 |
56
- | 0.8487 | 10.0 | 60 | 0.8243 |
57
 
58
 
59
  ### Framework versions
 
13
 
14
  This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 0.7400
17
 
18
  ## Model description
19
 
 
44
 
45
  | Training Loss | Epoch | Step | Validation Loss |
46
  |:-------------:|:-----:|:----:|:---------------:|
47
+ | 2.966 | 1.0 | 6 | 2.2765 |
48
+ | 2.0606 | 2.0 | 12 | 1.7855 |
49
+ | 1.6303 | 3.0 | 18 | 1.4249 |
50
+ | 1.2968 | 4.0 | 24 | 1.1742 |
51
+ | 1.1342 | 5.0 | 30 | 1.0421 |
52
+ | 0.9916 | 6.0 | 36 | 0.9159 |
53
+ | 0.8864 | 7.0 | 42 | 0.8410 |
54
+ | 0.8119 | 8.0 | 48 | 0.7857 |
55
+ | 0.7691 | 9.0 | 54 | 0.7509 |
56
+ | 0.7515 | 10.0 | 60 | 0.7400 |
57
 
58
 
59
  ### Framework versions
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c786ce574c7b54427c775c1c401bc60b3a2a1bf4da9d34ebd224728b1d9fdb1
3
  size 31213760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52242b7293996d19398d1cb5904e713f5bce9bdcddfa61064c3e552d21d77ae3
3
  size 31213760
runs/Feb28_13-41-13_3897ec21fae5/events.out.tfevents.1709127675.3897ec21fae5.21575.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0421b0459a1f756991e9096e9a3c2ce821a636db440b83873ad27b613c136813
3
+ size 12864
tokenizer.json CHANGED
@@ -71,7 +71,69 @@
71
  "pre_tokenizer": {
72
  "type": "Whitespace"
73
  },
74
- "post_processor": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  "decoder": null,
76
  "model": {
77
  "type": "BPE",
@@ -106,18 +168,18 @@
106
  "10": 21,
107
  "98": 22,
108
  "11": 23,
109
- "12": 24,
110
- "97": 25,
111
- "13": 26,
112
- "96": 27,
113
  "95": 28,
114
  "14": 29,
115
  "94": 30,
116
  "15": 31,
117
- "16": 32,
118
- "93": 33,
119
- "17": 34,
120
- "92": 35,
121
  "91": 36,
122
  "18": 37,
123
  "19": 38,
@@ -130,10 +192,10 @@
130
  "87": 45,
131
  "23": 46,
132
  "86": 47,
133
- "24": 48,
134
- "85": 49,
135
- "84": 50,
136
- "25": 51,
137
  "26": 52,
138
  "83": 53,
139
  "27": 54,
@@ -144,18 +206,18 @@
144
  "1 0",
145
  "9 8",
146
  "1 1",
147
- "1 2",
148
  "9 7",
149
- "1 3",
150
  "9 6",
 
151
  "9 5",
152
  "1 4",
153
  "9 4",
154
  "1 5",
155
- "1 6",
156
  "9 3",
157
- "1 7",
158
  "9 2",
 
159
  "9 1",
160
  "1 8",
161
  "1 9",
@@ -168,10 +230,10 @@
168
  "8 7",
169
  "2 3",
170
  "8 6",
171
- "2 4",
172
  "8 5",
173
- "8 4",
174
  "2 5",
 
175
  "2 6",
176
  "8 3",
177
  "2 7",
 
71
  "pre_tokenizer": {
72
  "type": "Whitespace"
73
  },
74
+ "post_processor": {
75
+ "type": "TemplateProcessing",
76
+ "single": [
77
+ {
78
+ "Sequence": {
79
+ "id": "A",
80
+ "type_id": 0
81
+ }
82
+ },
83
+ {
84
+ "SpecialToken": {
85
+ "id": "[CLS]",
86
+ "type_id": 0
87
+ }
88
+ }
89
+ ],
90
+ "pair": [
91
+ {
92
+ "Sequence": {
93
+ "id": "A",
94
+ "type_id": 0
95
+ }
96
+ },
97
+ {
98
+ "SpecialToken": {
99
+ "id": "[CLS]",
100
+ "type_id": 0
101
+ }
102
+ },
103
+ {
104
+ "Sequence": {
105
+ "id": "B",
106
+ "type_id": 1
107
+ }
108
+ },
109
+ {
110
+ "SpecialToken": {
111
+ "id": "[EOS]",
112
+ "type_id": 1
113
+ }
114
+ }
115
+ ],
116
+ "special_tokens": {
117
+ "[CLS]": {
118
+ "id": "[CLS]",
119
+ "ids": [
120
+ 0
121
+ ],
122
+ "tokens": [
123
+ "[CLS]"
124
+ ]
125
+ },
126
+ "[EOS]": {
127
+ "id": "[EOS]",
128
+ "ids": [
129
+ 1
130
+ ],
131
+ "tokens": [
132
+ "[EOS]"
133
+ ]
134
+ }
135
+ }
136
+ },
137
  "decoder": null,
138
  "model": {
139
  "type": "BPE",
 
168
  "10": 21,
169
  "98": 22,
170
  "11": 23,
171
+ "97": 24,
172
+ "12": 25,
173
+ "96": 26,
174
+ "13": 27,
175
  "95": 28,
176
  "14": 29,
177
  "94": 30,
178
  "15": 31,
179
+ "93": 32,
180
+ "16": 33,
181
+ "92": 34,
182
+ "17": 35,
183
  "91": 36,
184
  "18": 37,
185
  "19": 38,
 
192
  "87": 45,
193
  "23": 46,
194
  "86": 47,
195
+ "85": 48,
196
+ "24": 49,
197
+ "25": 50,
198
+ "84": 51,
199
  "26": 52,
200
  "83": 53,
201
  "27": 54,
 
206
  "1 0",
207
  "9 8",
208
  "1 1",
 
209
  "9 7",
210
+ "1 2",
211
  "9 6",
212
+ "1 3",
213
  "9 5",
214
  "1 4",
215
  "9 4",
216
  "1 5",
 
217
  "9 3",
218
+ "1 6",
219
  "9 2",
220
+ "1 7",
221
  "9 1",
222
  "1 8",
223
  "1 9",
 
230
  "8 7",
231
  "2 3",
232
  "8 6",
 
233
  "8 5",
234
+ "2 4",
235
  "2 5",
236
+ "8 4",
237
  "2 6",
238
  "8 3",
239
  "2 7",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6659b0093eeff414bea7b0676fa26b8ced67d1bab20bc510776e16dcea6efb68
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54a33d2f290f85e42924b5f98306a6bedf48ced4afa93e90600479ea6cfd23f
3
  size 4920