End of training
Browse files- all_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +45 -45
all_results.json
CHANGED
@@ -38,8 +38,8 @@
|
|
38 |
"predict_steps_per_second": 6.081,
|
39 |
"total_flos": 6.747257278287053e+16,
|
40 |
"train_loss": 0.6624447870913739,
|
41 |
-
"train_runtime":
|
42 |
"train_samples": 247,
|
43 |
-
"train_samples_per_second": 10.
|
44 |
-
"train_steps_per_second": 2.
|
45 |
}
|
|
|
38 |
"predict_steps_per_second": 6.081,
|
39 |
"total_flos": 6.747257278287053e+16,
|
40 |
"train_loss": 0.6624447870913739,
|
41 |
+
"train_runtime": 488.5119,
|
42 |
"train_samples": 247,
|
43 |
+
"train_samples_per_second": 10.112,
|
44 |
+
"train_steps_per_second": 2.538
|
45 |
}
|
train_results.json
CHANGED
@@ -2,8 +2,8 @@
|
|
2 |
"epoch": 14.0,
|
3 |
"total_flos": 6.747257278287053e+16,
|
4 |
"train_loss": 0.6624447870913739,
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 247,
|
7 |
-
"train_samples_per_second": 10.
|
8 |
-
"train_steps_per_second": 2.
|
9 |
}
|
|
|
2 |
"epoch": 14.0,
|
3 |
"total_flos": 6.747257278287053e+16,
|
4 |
"train_loss": 0.6624447870913739,
|
5 |
+
"train_runtime": 488.5119,
|
6 |
"train_samples": 247,
|
7 |
+
"train_samples_per_second": 10.112,
|
8 |
+
"train_steps_per_second": 2.538
|
9 |
}
|
trainer_state.json
CHANGED
@@ -18,9 +18,9 @@
|
|
18 |
"eval_precision-micro": 0.6509204584925321,
|
19 |
"eval_recall-macro": 0.24249037703341708,
|
20 |
"eval_recall-micro": 0.6509204584925321,
|
21 |
-
"eval_runtime": 1.
|
22 |
-
"eval_samples_per_second":
|
23 |
-
"eval_steps_per_second":
|
24 |
"step": 62
|
25 |
},
|
26 |
{
|
@@ -33,9 +33,9 @@
|
|
33 |
"eval_precision-micro": 0.7349774227162209,
|
34 |
"eval_recall-macro": 0.5291052629047126,
|
35 |
"eval_recall-micro": 0.7349774227162209,
|
36 |
-
"eval_runtime":
|
37 |
-
"eval_samples_per_second":
|
38 |
-
"eval_steps_per_second":
|
39 |
"step": 124
|
40 |
},
|
41 |
{
|
@@ -48,9 +48,9 @@
|
|
48 |
"eval_precision-micro": 0.7342827370614797,
|
49 |
"eval_recall-macro": 0.5381948279596481,
|
50 |
"eval_recall-micro": 0.7342827370614797,
|
51 |
-
"eval_runtime": 1.
|
52 |
-
"eval_samples_per_second":
|
53 |
-
"eval_steps_per_second": 5.
|
54 |
"step": 186
|
55 |
},
|
56 |
{
|
@@ -63,9 +63,9 @@
|
|
63 |
"eval_precision-micro": 0.7502605071205279,
|
64 |
"eval_recall-macro": 0.5200955397553431,
|
65 |
"eval_recall-micro": 0.7502605071205279,
|
66 |
-
"eval_runtime":
|
67 |
-
"eval_samples_per_second":
|
68 |
-
"eval_steps_per_second":
|
69 |
"step": 248
|
70 |
},
|
71 |
{
|
@@ -78,9 +78,9 @@
|
|
78 |
"eval_precision-micro": 0.7641542202153525,
|
79 |
"eval_recall-macro": 0.5462553107739512,
|
80 |
"eval_recall-micro": 0.7641542202153525,
|
81 |
-
"eval_runtime":
|
82 |
-
"eval_samples_per_second":
|
83 |
-
"eval_steps_per_second":
|
84 |
"step": 310
|
85 |
},
|
86 |
{
|
@@ -93,9 +93,9 @@
|
|
93 |
"eval_precision-micro": 0.774574505036471,
|
94 |
"eval_recall-macro": 0.5431283891127849,
|
95 |
"eval_recall-micro": 0.774574505036471,
|
96 |
-
"eval_runtime":
|
97 |
-
"eval_samples_per_second":
|
98 |
-
"eval_steps_per_second":
|
99 |
"step": 372
|
100 |
},
|
101 |
{
|
@@ -108,9 +108,9 @@
|
|
108 |
"eval_precision-micro": 0.7811740187565127,
|
109 |
"eval_recall-macro": 0.5125569147899907,
|
110 |
"eval_recall-micro": 0.7811740187565127,
|
111 |
-
"eval_runtime": 1.
|
112 |
-
"eval_samples_per_second":
|
113 |
-
"eval_steps_per_second":
|
114 |
"step": 434
|
115 |
},
|
116 |
{
|
@@ -123,9 +123,9 @@
|
|
123 |
"eval_precision-micro": 0.7825633900659952,
|
124 |
"eval_recall-macro": 0.5470775441802167,
|
125 |
"eval_recall-micro": 0.7825633900659952,
|
126 |
-
"eval_runtime": 1.
|
127 |
-
"eval_samples_per_second":
|
128 |
-
"eval_steps_per_second":
|
129 |
"step": 496
|
130 |
},
|
131 |
{
|
@@ -145,9 +145,9 @@
|
|
145 |
"eval_precision-micro": 0.7735324765543592,
|
146 |
"eval_recall-macro": 0.5818475586367124,
|
147 |
"eval_recall-micro": 0.7735324765543592,
|
148 |
-
"eval_runtime": 1.
|
149 |
-
"eval_samples_per_second":
|
150 |
-
"eval_steps_per_second":
|
151 |
"step": 558
|
152 |
},
|
153 |
{
|
@@ -160,9 +160,9 @@
|
|
160 |
"eval_precision-micro": 0.7783952761375478,
|
161 |
"eval_recall-macro": 0.5655629578179421,
|
162 |
"eval_recall-micro": 0.7783952761375478,
|
163 |
-
"eval_runtime":
|
164 |
-
"eval_samples_per_second":
|
165 |
-
"eval_steps_per_second":
|
166 |
"step": 620
|
167 |
},
|
168 |
{
|
@@ -175,9 +175,9 @@
|
|
175 |
"eval_precision-micro": 0.7829107328933658,
|
176 |
"eval_recall-macro": 0.5834711775606751,
|
177 |
"eval_recall-micro": 0.7829107328933658,
|
178 |
-
"eval_runtime":
|
179 |
-
"eval_samples_per_second":
|
180 |
-
"eval_steps_per_second":
|
181 |
"step": 682
|
182 |
},
|
183 |
{
|
@@ -190,9 +190,9 @@
|
|
190 |
"eval_precision-micro": 0.7738798193817298,
|
191 |
"eval_recall-macro": 0.5885123710730829,
|
192 |
"eval_recall-micro": 0.7738798193817298,
|
193 |
-
"eval_runtime": 1.
|
194 |
-
"eval_samples_per_second":
|
195 |
-
"eval_steps_per_second": 5.
|
196 |
"step": 744
|
197 |
},
|
198 |
{
|
@@ -205,9 +205,9 @@
|
|
205 |
"eval_precision-micro": 0.7780479333101772,
|
206 |
"eval_recall-macro": 0.5748658781079373,
|
207 |
"eval_recall-micro": 0.7780479333101772,
|
208 |
-
"eval_runtime":
|
209 |
-
"eval_samples_per_second":
|
210 |
-
"eval_steps_per_second":
|
211 |
"step": 806
|
212 |
},
|
213 |
{
|
@@ -220,9 +220,9 @@
|
|
220 |
"eval_precision-micro": 0.7797846474470302,
|
221 |
"eval_recall-macro": 0.5868004304340952,
|
222 |
"eval_recall-micro": 0.7797846474470302,
|
223 |
-
"eval_runtime": 2.
|
224 |
-
"eval_samples_per_second":
|
225 |
-
"eval_steps_per_second": 3.
|
226 |
"step": 868
|
227 |
},
|
228 |
{
|
@@ -230,9 +230,9 @@
|
|
230 |
"step": 868,
|
231 |
"total_flos": 6.747257278287053e+16,
|
232 |
"train_loss": 0.6624447870913739,
|
233 |
-
"train_runtime":
|
234 |
-
"train_samples_per_second": 10.
|
235 |
-
"train_steps_per_second": 2.
|
236 |
}
|
237 |
],
|
238 |
"logging_steps": 500,
|
|
|
18 |
"eval_precision-micro": 0.6509204584925321,
|
19 |
"eval_recall-macro": 0.24249037703341708,
|
20 |
"eval_recall-micro": 0.6509204584925321,
|
21 |
+
"eval_runtime": 1.5286,
|
22 |
+
"eval_samples_per_second": 19.625,
|
23 |
+
"eval_steps_per_second": 5.233,
|
24 |
"step": 62
|
25 |
},
|
26 |
{
|
|
|
33 |
"eval_precision-micro": 0.7349774227162209,
|
34 |
"eval_recall-macro": 0.5291052629047126,
|
35 |
"eval_recall-micro": 0.7349774227162209,
|
36 |
+
"eval_runtime": 1.6436,
|
37 |
+
"eval_samples_per_second": 18.252,
|
38 |
+
"eval_steps_per_second": 4.867,
|
39 |
"step": 124
|
40 |
},
|
41 |
{
|
|
|
48 |
"eval_precision-micro": 0.7342827370614797,
|
49 |
"eval_recall-macro": 0.5381948279596481,
|
50 |
"eval_recall-micro": 0.7342827370614797,
|
51 |
+
"eval_runtime": 1.5882,
|
52 |
+
"eval_samples_per_second": 18.889,
|
53 |
+
"eval_steps_per_second": 5.037,
|
54 |
"step": 186
|
55 |
},
|
56 |
{
|
|
|
63 |
"eval_precision-micro": 0.7502605071205279,
|
64 |
"eval_recall-macro": 0.5200955397553431,
|
65 |
"eval_recall-micro": 0.7502605071205279,
|
66 |
+
"eval_runtime": 1.601,
|
67 |
+
"eval_samples_per_second": 18.738,
|
68 |
+
"eval_steps_per_second": 4.997,
|
69 |
"step": 248
|
70 |
},
|
71 |
{
|
|
|
78 |
"eval_precision-micro": 0.7641542202153525,
|
79 |
"eval_recall-macro": 0.5462553107739512,
|
80 |
"eval_recall-micro": 0.7641542202153525,
|
81 |
+
"eval_runtime": 2.1379,
|
82 |
+
"eval_samples_per_second": 14.032,
|
83 |
+
"eval_steps_per_second": 3.742,
|
84 |
"step": 310
|
85 |
},
|
86 |
{
|
|
|
93 |
"eval_precision-micro": 0.774574505036471,
|
94 |
"eval_recall-macro": 0.5431283891127849,
|
95 |
"eval_recall-micro": 0.774574505036471,
|
96 |
+
"eval_runtime": 2.1932,
|
97 |
+
"eval_samples_per_second": 13.679,
|
98 |
+
"eval_steps_per_second": 3.648,
|
99 |
"step": 372
|
100 |
},
|
101 |
{
|
|
|
108 |
"eval_precision-micro": 0.7811740187565127,
|
109 |
"eval_recall-macro": 0.5125569147899907,
|
110 |
"eval_recall-micro": 0.7811740187565127,
|
111 |
+
"eval_runtime": 1.6371,
|
112 |
+
"eval_samples_per_second": 18.326,
|
113 |
+
"eval_steps_per_second": 4.887,
|
114 |
"step": 434
|
115 |
},
|
116 |
{
|
|
|
123 |
"eval_precision-micro": 0.7825633900659952,
|
124 |
"eval_recall-macro": 0.5470775441802167,
|
125 |
"eval_recall-micro": 0.7825633900659952,
|
126 |
+
"eval_runtime": 1.6786,
|
127 |
+
"eval_samples_per_second": 17.872,
|
128 |
+
"eval_steps_per_second": 4.766,
|
129 |
"step": 496
|
130 |
},
|
131 |
{
|
|
|
145 |
"eval_precision-micro": 0.7735324765543592,
|
146 |
"eval_recall-macro": 0.5818475586367124,
|
147 |
"eval_recall-micro": 0.7735324765543592,
|
148 |
+
"eval_runtime": 1.5468,
|
149 |
+
"eval_samples_per_second": 19.395,
|
150 |
+
"eval_steps_per_second": 5.172,
|
151 |
"step": 558
|
152 |
},
|
153 |
{
|
|
|
160 |
"eval_precision-micro": 0.7783952761375478,
|
161 |
"eval_recall-macro": 0.5655629578179421,
|
162 |
"eval_recall-micro": 0.7783952761375478,
|
163 |
+
"eval_runtime": 2.2548,
|
164 |
+
"eval_samples_per_second": 13.305,
|
165 |
+
"eval_steps_per_second": 3.548,
|
166 |
"step": 620
|
167 |
},
|
168 |
{
|
|
|
175 |
"eval_precision-micro": 0.7829107328933658,
|
176 |
"eval_recall-macro": 0.5834711775606751,
|
177 |
"eval_recall-micro": 0.7829107328933658,
|
178 |
+
"eval_runtime": 2.2566,
|
179 |
+
"eval_samples_per_second": 13.295,
|
180 |
+
"eval_steps_per_second": 3.545,
|
181 |
"step": 682
|
182 |
},
|
183 |
{
|
|
|
190 |
"eval_precision-micro": 0.7738798193817298,
|
191 |
"eval_recall-macro": 0.5885123710730829,
|
192 |
"eval_recall-micro": 0.7738798193817298,
|
193 |
+
"eval_runtime": 1.5545,
|
194 |
+
"eval_samples_per_second": 19.299,
|
195 |
+
"eval_steps_per_second": 5.146,
|
196 |
"step": 744
|
197 |
},
|
198 |
{
|
|
|
205 |
"eval_precision-micro": 0.7780479333101772,
|
206 |
"eval_recall-macro": 0.5748658781079373,
|
207 |
"eval_recall-micro": 0.7780479333101772,
|
208 |
+
"eval_runtime": 1.5795,
|
209 |
+
"eval_samples_per_second": 18.993,
|
210 |
+
"eval_steps_per_second": 5.065,
|
211 |
"step": 806
|
212 |
},
|
213 |
{
|
|
|
220 |
"eval_precision-micro": 0.7797846474470302,
|
221 |
"eval_recall-macro": 0.5868004304340952,
|
222 |
"eval_recall-micro": 0.7797846474470302,
|
223 |
+
"eval_runtime": 2.326,
|
224 |
+
"eval_samples_per_second": 12.898,
|
225 |
+
"eval_steps_per_second": 3.439,
|
226 |
"step": 868
|
227 |
},
|
228 |
{
|
|
|
230 |
"step": 868,
|
231 |
"total_flos": 6.747257278287053e+16,
|
232 |
"train_loss": 0.6624447870913739,
|
233 |
+
"train_runtime": 488.5119,
|
234 |
+
"train_samples_per_second": 10.112,
|
235 |
+
"train_steps_per_second": 2.538
|
236 |
}
|
237 |
],
|
238 |
"logging_steps": 500,
|