jorgeortizfuentes
commited on
Commit
•
d39ed56
1
Parent(s):
d5aa309
End of training
Browse files
all_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 1120,
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
+
"train_loss": 0.17726608804294042,
|
4 |
+
"train_runtime": 611.8323,
|
5 |
"train_samples": 1120,
|
6 |
+
"train_samples_per_second": 9.153,
|
7 |
+
"train_steps_per_second": 1.144
|
8 |
}
|
predict_results_fake-news.txt
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
index prediction
|
2 |
0 1
|
3 |
-
1
|
4 |
2 1
|
5 |
3 1
|
6 |
4 1
|
@@ -35,13 +35,13 @@ index prediction
|
|
35 |
33 1
|
36 |
34 1
|
37 |
35 1
|
38 |
-
36
|
39 |
37 1
|
40 |
38 0
|
41 |
39 0
|
42 |
40 0
|
43 |
41 1
|
44 |
-
42
|
45 |
43 1
|
46 |
44 0
|
47 |
45 0
|
@@ -54,7 +54,7 @@ index prediction
|
|
54 |
52 0
|
55 |
53 1
|
56 |
54 1
|
57 |
-
55
|
58 |
56 0
|
59 |
57 1
|
60 |
58 1
|
@@ -64,7 +64,7 @@ index prediction
|
|
64 |
62 1
|
65 |
63 0
|
66 |
64 1
|
67 |
-
65
|
68 |
66 1
|
69 |
67 0
|
70 |
68 0
|
@@ -75,8 +75,8 @@ index prediction
|
|
75 |
73 1
|
76 |
74 1
|
77 |
75 0
|
78 |
-
76
|
79 |
-
77
|
80 |
78 0
|
81 |
79 1
|
82 |
80 1
|
@@ -107,7 +107,7 @@ index prediction
|
|
107 |
105 1
|
108 |
106 0
|
109 |
107 1
|
110 |
-
108
|
111 |
109 1
|
112 |
110 0
|
113 |
111 0
|
@@ -133,7 +133,7 @@ index prediction
|
|
133 |
131 1
|
134 |
132 0
|
135 |
133 0
|
136 |
-
134
|
137 |
135 1
|
138 |
136 1
|
139 |
137 1
|
@@ -148,7 +148,7 @@ index prediction
|
|
148 |
146 0
|
149 |
147 1
|
150 |
148 1
|
151 |
-
149
|
152 |
150 0
|
153 |
151 1
|
154 |
152 0
|
@@ -162,11 +162,11 @@ index prediction
|
|
162 |
160 1
|
163 |
161 0
|
164 |
162 0
|
165 |
-
163
|
166 |
164 1
|
167 |
-
165
|
168 |
166 0
|
169 |
-
167
|
170 |
168 0
|
171 |
169 1
|
172 |
170 1
|
@@ -187,17 +187,17 @@ index prediction
|
|
187 |
185 1
|
188 |
186 0
|
189 |
187 0
|
190 |
-
188
|
191 |
189 0
|
192 |
190 0
|
193 |
191 0
|
194 |
-
192
|
195 |
193 1
|
196 |
194 0
|
197 |
195 1
|
198 |
196 0
|
199 |
197 1
|
200 |
-
198
|
201 |
199 1
|
202 |
200 0
|
203 |
201 1
|
@@ -218,7 +218,7 @@ index prediction
|
|
218 |
216 0
|
219 |
217 0
|
220 |
218 1
|
221 |
-
219
|
222 |
220 1
|
223 |
221 0
|
224 |
222 1
|
|
|
1 |
index prediction
|
2 |
0 1
|
3 |
+
1 0
|
4 |
2 1
|
5 |
3 1
|
6 |
4 1
|
|
|
35 |
33 1
|
36 |
34 1
|
37 |
35 1
|
38 |
+
36 0
|
39 |
37 1
|
40 |
38 0
|
41 |
39 0
|
42 |
40 0
|
43 |
41 1
|
44 |
+
42 0
|
45 |
43 1
|
46 |
44 0
|
47 |
45 0
|
|
|
54 |
52 0
|
55 |
53 1
|
56 |
54 1
|
57 |
+
55 1
|
58 |
56 0
|
59 |
57 1
|
60 |
58 1
|
|
|
64 |
62 1
|
65 |
63 0
|
66 |
64 1
|
67 |
+
65 0
|
68 |
66 1
|
69 |
67 0
|
70 |
68 0
|
|
|
75 |
73 1
|
76 |
74 1
|
77 |
75 0
|
78 |
+
76 1
|
79 |
+
77 1
|
80 |
78 0
|
81 |
79 1
|
82 |
80 1
|
|
|
107 |
105 1
|
108 |
106 0
|
109 |
107 1
|
110 |
+
108 0
|
111 |
109 1
|
112 |
110 0
|
113 |
111 0
|
|
|
133 |
131 1
|
134 |
132 0
|
135 |
133 0
|
136 |
+
134 1
|
137 |
135 1
|
138 |
136 1
|
139 |
137 1
|
|
|
148 |
146 0
|
149 |
147 1
|
150 |
148 1
|
151 |
+
149 0
|
152 |
150 0
|
153 |
151 1
|
154 |
152 0
|
|
|
162 |
160 1
|
163 |
161 0
|
164 |
162 0
|
165 |
+
163 0
|
166 |
164 1
|
167 |
+
165 1
|
168 |
166 0
|
169 |
+
167 0
|
170 |
168 0
|
171 |
169 1
|
172 |
170 1
|
|
|
187 |
185 1
|
188 |
186 0
|
189 |
187 0
|
190 |
+
188 1
|
191 |
189 0
|
192 |
190 0
|
193 |
191 0
|
194 |
+
192 0
|
195 |
193 1
|
196 |
194 0
|
197 |
195 1
|
198 |
196 0
|
199 |
197 1
|
200 |
+
198 0
|
201 |
199 1
|
202 |
200 0
|
203 |
201 1
|
|
|
218 |
216 0
|
219 |
217 0
|
220 |
218 1
|
221 |
+
219 1
|
222 |
220 1
|
223 |
221 0
|
224 |
222 1
|
runs/Jul05_08-58-57_0a840cd07d02/events.out.tfevents.1688548330.0a840cd07d02.804.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0932018f9cd7bb8d4c7eae2371dcae97e28e0102b2021870b1ea0cd5abd1ab0b
|
3 |
+
size 405
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
-
"train_loss": 0.
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 1120,
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 5.0,
|
3 |
+
"train_loss": 0.17726608804294042,
|
4 |
+
"train_runtime": 611.8323,
|
5 |
"train_samples": 1120,
|
6 |
+
"train_samples_per_second": 9.153,
|
7 |
+
"train_steps_per_second": 1.144
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "models/fake-news-bert-base-spanish-wwm-cased/checkpoint-
|
4 |
"epoch": 5.0,
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -10,89 +10,89 @@
|
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
"learning_rate": 1.6000000000000003e-05,
|
13 |
-
"loss": 0.
|
14 |
-
"step":
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
-
"eval_f1": 0.
|
19 |
-
"eval_loss": 0.
|
20 |
-
"eval_runtime":
|
21 |
-
"eval_samples_per_second":
|
22 |
-
"eval_steps_per_second":
|
23 |
-
"step":
|
24 |
},
|
25 |
{
|
26 |
"epoch": 2.0,
|
27 |
"learning_rate": 1.2e-05,
|
28 |
-
"loss": 0.
|
29 |
-
"step":
|
30 |
},
|
31 |
{
|
32 |
"epoch": 2.0,
|
33 |
-
"eval_f1": 0.
|
34 |
-
"eval_loss": 0.
|
35 |
-
"eval_runtime":
|
36 |
-
"eval_samples_per_second":
|
37 |
-
"eval_steps_per_second":
|
38 |
-
"step":
|
39 |
},
|
40 |
{
|
41 |
"epoch": 3.0,
|
42 |
"learning_rate": 8.000000000000001e-06,
|
43 |
-
"loss": 0.
|
44 |
-
"step":
|
45 |
},
|
46 |
{
|
47 |
"epoch": 3.0,
|
48 |
-
"eval_f1": 0.
|
49 |
-
"eval_loss": 0.
|
50 |
-
"eval_runtime":
|
51 |
-
"eval_samples_per_second":
|
52 |
-
"eval_steps_per_second":
|
53 |
-
"step":
|
54 |
},
|
55 |
{
|
56 |
"epoch": 4.0,
|
57 |
"learning_rate": 4.000000000000001e-06,
|
58 |
-
"loss": 0.
|
59 |
-
"step":
|
60 |
},
|
61 |
{
|
62 |
"epoch": 4.0,
|
63 |
-
"eval_f1": 0.
|
64 |
-
"eval_loss": 0.
|
65 |
-
"eval_runtime":
|
66 |
-
"eval_samples_per_second":
|
67 |
-
"eval_steps_per_second":
|
68 |
-
"step":
|
69 |
},
|
70 |
{
|
71 |
"epoch": 5.0,
|
72 |
"learning_rate": 0.0,
|
73 |
-
"loss": 0.
|
74 |
-
"step":
|
75 |
},
|
76 |
{
|
77 |
"epoch": 5.0,
|
78 |
-
"eval_f1": 0.
|
79 |
-
"eval_loss": 0.
|
80 |
-
"eval_runtime":
|
81 |
-
"eval_samples_per_second":
|
82 |
-
"eval_steps_per_second":
|
83 |
-
"step":
|
84 |
},
|
85 |
{
|
86 |
"epoch": 5.0,
|
87 |
-
"step":
|
88 |
"total_flos": 1473421910016000.0,
|
89 |
-
"train_loss": 0.
|
90 |
-
"train_runtime":
|
91 |
-
"train_samples_per_second":
|
92 |
-
"train_steps_per_second":
|
93 |
}
|
94 |
],
|
95 |
-
"max_steps":
|
96 |
"num_train_epochs": 5,
|
97 |
"total_flos": 1473421910016000.0,
|
98 |
"trial_name": null,
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.8968609865470851,
|
3 |
+
"best_model_checkpoint": "models/fake-news-bert-base-spanish-wwm-cased/checkpoint-420",
|
4 |
"epoch": 5.0,
|
5 |
+
"global_step": 700,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
"learning_rate": 1.6000000000000003e-05,
|
13 |
+
"loss": 0.5098,
|
14 |
+
"step": 140
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
+
"eval_f1": 0.7340425531914895,
|
19 |
+
"eval_loss": 0.49776777625083923,
|
20 |
+
"eval_runtime": 8.4133,
|
21 |
+
"eval_samples_per_second": 28.526,
|
22 |
+
"eval_steps_per_second": 3.566,
|
23 |
+
"step": 140
|
24 |
},
|
25 |
{
|
26 |
"epoch": 2.0,
|
27 |
"learning_rate": 1.2e-05,
|
28 |
+
"loss": 0.2473,
|
29 |
+
"step": 280
|
30 |
},
|
31 |
{
|
32 |
"epoch": 2.0,
|
33 |
+
"eval_f1": 0.8828828828828829,
|
34 |
+
"eval_loss": 0.38877564668655396,
|
35 |
+
"eval_runtime": 8.625,
|
36 |
+
"eval_samples_per_second": 27.826,
|
37 |
+
"eval_steps_per_second": 3.478,
|
38 |
+
"step": 280
|
39 |
},
|
40 |
{
|
41 |
"epoch": 3.0,
|
42 |
"learning_rate": 8.000000000000001e-06,
|
43 |
+
"loss": 0.0908,
|
44 |
+
"step": 420
|
45 |
},
|
46 |
{
|
47 |
"epoch": 3.0,
|
48 |
+
"eval_f1": 0.8968609865470851,
|
49 |
+
"eval_loss": 0.44203802943229675,
|
50 |
+
"eval_runtime": 8.4917,
|
51 |
+
"eval_samples_per_second": 28.263,
|
52 |
+
"eval_steps_per_second": 3.533,
|
53 |
+
"step": 420
|
54 |
},
|
55 |
{
|
56 |
"epoch": 4.0,
|
57 |
"learning_rate": 4.000000000000001e-06,
|
58 |
+
"loss": 0.0332,
|
59 |
+
"step": 560
|
60 |
},
|
61 |
{
|
62 |
"epoch": 4.0,
|
63 |
+
"eval_f1": 0.8796296296296298,
|
64 |
+
"eval_loss": 0.5603806376457214,
|
65 |
+
"eval_runtime": 8.5449,
|
66 |
+
"eval_samples_per_second": 28.087,
|
67 |
+
"eval_steps_per_second": 3.511,
|
68 |
+
"step": 560
|
69 |
},
|
70 |
{
|
71 |
"epoch": 5.0,
|
72 |
"learning_rate": 0.0,
|
73 |
+
"loss": 0.0052,
|
74 |
+
"step": 700
|
75 |
},
|
76 |
{
|
77 |
"epoch": 5.0,
|
78 |
+
"eval_f1": 0.8956521739130435,
|
79 |
+
"eval_loss": 0.5154075622558594,
|
80 |
+
"eval_runtime": 8.6086,
|
81 |
+
"eval_samples_per_second": 27.879,
|
82 |
+
"eval_steps_per_second": 3.485,
|
83 |
+
"step": 700
|
84 |
},
|
85 |
{
|
86 |
"epoch": 5.0,
|
87 |
+
"step": 700,
|
88 |
"total_flos": 1473421910016000.0,
|
89 |
+
"train_loss": 0.17726608804294042,
|
90 |
+
"train_runtime": 611.8323,
|
91 |
+
"train_samples_per_second": 9.153,
|
92 |
+
"train_steps_per_second": 1.144
|
93 |
}
|
94 |
],
|
95 |
+
"max_steps": 700,
|
96 |
"num_train_epochs": 5,
|
97 |
"total_flos": 1473421910016000.0,
|
98 |
"trial_name": null,
|