jorgeortizfuentes commited on
Commit
d39ed56
1 Parent(s): d5aa309

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.18657105684280395,
4
- "train_runtime": 93.1154,
5
  "train_samples": 1120,
6
- "train_samples_per_second": 60.14,
7
- "train_steps_per_second": 3.759
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.17726608804294042,
4
+ "train_runtime": 611.8323,
5
  "train_samples": 1120,
6
+ "train_samples_per_second": 9.153,
7
+ "train_steps_per_second": 1.144
8
  }
predict_results_fake-news.txt CHANGED
@@ -1,6 +1,6 @@
1
  index prediction
2
  0 1
3
- 1 1
4
  2 1
5
  3 1
6
  4 1
@@ -35,13 +35,13 @@ index prediction
35
  33 1
36
  34 1
37
  35 1
38
- 36 1
39
  37 1
40
  38 0
41
  39 0
42
  40 0
43
  41 1
44
- 42 1
45
  43 1
46
  44 0
47
  45 0
@@ -54,7 +54,7 @@ index prediction
54
  52 0
55
  53 1
56
  54 1
57
- 55 0
58
  56 0
59
  57 1
60
  58 1
@@ -64,7 +64,7 @@ index prediction
64
  62 1
65
  63 0
66
  64 1
67
- 65 1
68
  66 1
69
  67 0
70
  68 0
@@ -75,8 +75,8 @@ index prediction
75
  73 1
76
  74 1
77
  75 0
78
- 76 0
79
- 77 0
80
  78 0
81
  79 1
82
  80 1
@@ -107,7 +107,7 @@ index prediction
107
  105 1
108
  106 0
109
  107 1
110
- 108 1
111
  109 1
112
  110 0
113
  111 0
@@ -133,7 +133,7 @@ index prediction
133
  131 1
134
  132 0
135
  133 0
136
- 134 0
137
  135 1
138
  136 1
139
  137 1
@@ -148,7 +148,7 @@ index prediction
148
  146 0
149
  147 1
150
  148 1
151
- 149 1
152
  150 0
153
  151 1
154
  152 0
@@ -162,11 +162,11 @@ index prediction
162
  160 1
163
  161 0
164
  162 0
165
- 163 1
166
  164 1
167
- 165 0
168
  166 0
169
- 167 1
170
  168 0
171
  169 1
172
  170 1
@@ -187,17 +187,17 @@ index prediction
187
  185 1
188
  186 0
189
  187 0
190
- 188 0
191
  189 0
192
  190 0
193
  191 0
194
- 192 1
195
  193 1
196
  194 0
197
  195 1
198
  196 0
199
  197 1
200
- 198 1
201
  199 1
202
  200 0
203
  201 1
@@ -218,7 +218,7 @@ index prediction
218
  216 0
219
  217 0
220
  218 1
221
- 219 0
222
  220 1
223
  221 0
224
  222 1
 
1
  index prediction
2
  0 1
3
+ 1 0
4
  2 1
5
  3 1
6
  4 1
 
35
  33 1
36
  34 1
37
  35 1
38
+ 36 0
39
  37 1
40
  38 0
41
  39 0
42
  40 0
43
  41 1
44
+ 42 0
45
  43 1
46
  44 0
47
  45 0
 
54
  52 0
55
  53 1
56
  54 1
57
+ 55 1
58
  56 0
59
  57 1
60
  58 1
 
64
  62 1
65
  63 0
66
  64 1
67
+ 65 0
68
  66 1
69
  67 0
70
  68 0
 
75
  73 1
76
  74 1
77
  75 0
78
+ 76 1
79
+ 77 1
80
  78 0
81
  79 1
82
  80 1
 
107
  105 1
108
  106 0
109
  107 1
110
+ 108 0
111
  109 1
112
  110 0
113
  111 0
 
133
  131 1
134
  132 0
135
  133 0
136
+ 134 1
137
  135 1
138
  136 1
139
  137 1
 
148
  146 0
149
  147 1
150
  148 1
151
+ 149 0
152
  150 0
153
  151 1
154
  152 0
 
162
  160 1
163
  161 0
164
  162 0
165
+ 163 0
166
  164 1
167
+ 165 1
168
  166 0
169
+ 167 0
170
  168 0
171
  169 1
172
  170 1
 
187
  185 1
188
  186 0
189
  187 0
190
+ 188 1
191
  189 0
192
  190 0
193
  191 0
194
+ 192 0
195
  193 1
196
  194 0
197
  195 1
198
  196 0
199
  197 1
200
+ 198 0
201
  199 1
202
  200 0
203
  201 1
 
218
  216 0
219
  217 0
220
  218 1
221
+ 219 1
222
  220 1
223
  221 0
224
  222 1
runs/Jul05_08-58-57_0a840cd07d02/events.out.tfevents.1688548330.0a840cd07d02.804.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0932018f9cd7bb8d4c7eae2371dcae97e28e0102b2021870b1ea0cd5abd1ab0b
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.18657105684280395,
4
- "train_runtime": 93.1154,
5
  "train_samples": 1120,
6
- "train_samples_per_second": 60.14,
7
- "train_steps_per_second": 3.759
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.17726608804294042,
4
+ "train_runtime": 611.8323,
5
  "train_samples": 1120,
6
+ "train_samples_per_second": 9.153,
7
+ "train_steps_per_second": 1.144
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.8908296943231441,
3
- "best_model_checkpoint": "models/fake-news-bert-base-spanish-wwm-cased/checkpoint-210",
4
  "epoch": 5.0,
5
- "global_step": 350,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -10,89 +10,89 @@
10
  {
11
  "epoch": 1.0,
12
  "learning_rate": 1.6000000000000003e-05,
13
- "loss": 0.512,
14
- "step": 70
15
  },
16
  {
17
  "epoch": 1.0,
18
- "eval_f1": 0.7473684210526316,
19
- "eval_loss": 0.5346518158912659,
20
- "eval_runtime": 1.3022,
21
- "eval_samples_per_second": 184.298,
22
- "eval_steps_per_second": 11.519,
23
- "step": 70
24
  },
25
  {
26
  "epoch": 2.0,
27
  "learning_rate": 1.2e-05,
28
- "loss": 0.2281,
29
- "step": 140
30
  },
31
  {
32
  "epoch": 2.0,
33
- "eval_f1": 0.8333333333333334,
34
- "eval_loss": 0.3819647431373596,
35
- "eval_runtime": 1.3101,
36
- "eval_samples_per_second": 183.197,
37
- "eval_steps_per_second": 11.45,
38
- "step": 140
39
  },
40
  {
41
  "epoch": 3.0,
42
  "learning_rate": 8.000000000000001e-06,
43
- "loss": 0.1212,
44
- "step": 210
45
  },
46
  {
47
  "epoch": 3.0,
48
- "eval_f1": 0.8908296943231441,
49
- "eval_loss": 0.3823632299900055,
50
- "eval_runtime": 1.3116,
51
- "eval_samples_per_second": 182.984,
52
- "eval_steps_per_second": 11.437,
53
- "step": 210
54
  },
55
  {
56
  "epoch": 4.0,
57
  "learning_rate": 4.000000000000001e-06,
58
- "loss": 0.0495,
59
- "step": 280
60
  },
61
  {
62
  "epoch": 4.0,
63
- "eval_f1": 0.8818181818181818,
64
- "eval_loss": 0.4416821300983429,
65
- "eval_runtime": 1.3226,
66
- "eval_samples_per_second": 181.456,
67
- "eval_steps_per_second": 11.341,
68
- "step": 280
69
  },
70
  {
71
  "epoch": 5.0,
72
  "learning_rate": 0.0,
73
- "loss": 0.0221,
74
- "step": 350
75
  },
76
  {
77
  "epoch": 5.0,
78
- "eval_f1": 0.8767123287671234,
79
- "eval_loss": 0.504033088684082,
80
- "eval_runtime": 1.3358,
81
- "eval_samples_per_second": 179.671,
82
- "eval_steps_per_second": 11.229,
83
- "step": 350
84
  },
85
  {
86
  "epoch": 5.0,
87
- "step": 350,
88
  "total_flos": 1473421910016000.0,
89
- "train_loss": 0.18657105684280395,
90
- "train_runtime": 93.1154,
91
- "train_samples_per_second": 60.14,
92
- "train_steps_per_second": 3.759
93
  }
94
  ],
95
- "max_steps": 350,
96
  "num_train_epochs": 5,
97
  "total_flos": 1473421910016000.0,
98
  "trial_name": null,
 
1
  {
2
+ "best_metric": 0.8968609865470851,
3
+ "best_model_checkpoint": "models/fake-news-bert-base-spanish-wwm-cased/checkpoint-420",
4
  "epoch": 5.0,
5
+ "global_step": 700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
10
  {
11
  "epoch": 1.0,
12
  "learning_rate": 1.6000000000000003e-05,
13
+ "loss": 0.5098,
14
+ "step": 140
15
  },
16
  {
17
  "epoch": 1.0,
18
+ "eval_f1": 0.7340425531914895,
19
+ "eval_loss": 0.49776777625083923,
20
+ "eval_runtime": 8.4133,
21
+ "eval_samples_per_second": 28.526,
22
+ "eval_steps_per_second": 3.566,
23
+ "step": 140
24
  },
25
  {
26
  "epoch": 2.0,
27
  "learning_rate": 1.2e-05,
28
+ "loss": 0.2473,
29
+ "step": 280
30
  },
31
  {
32
  "epoch": 2.0,
33
+ "eval_f1": 0.8828828828828829,
34
+ "eval_loss": 0.38877564668655396,
35
+ "eval_runtime": 8.625,
36
+ "eval_samples_per_second": 27.826,
37
+ "eval_steps_per_second": 3.478,
38
+ "step": 280
39
  },
40
  {
41
  "epoch": 3.0,
42
  "learning_rate": 8.000000000000001e-06,
43
+ "loss": 0.0908,
44
+ "step": 420
45
  },
46
  {
47
  "epoch": 3.0,
48
+ "eval_f1": 0.8968609865470851,
49
+ "eval_loss": 0.44203802943229675,
50
+ "eval_runtime": 8.4917,
51
+ "eval_samples_per_second": 28.263,
52
+ "eval_steps_per_second": 3.533,
53
+ "step": 420
54
  },
55
  {
56
  "epoch": 4.0,
57
  "learning_rate": 4.000000000000001e-06,
58
+ "loss": 0.0332,
59
+ "step": 560
60
  },
61
  {
62
  "epoch": 4.0,
63
+ "eval_f1": 0.8796296296296298,
64
+ "eval_loss": 0.5603806376457214,
65
+ "eval_runtime": 8.5449,
66
+ "eval_samples_per_second": 28.087,
67
+ "eval_steps_per_second": 3.511,
68
+ "step": 560
69
  },
70
  {
71
  "epoch": 5.0,
72
  "learning_rate": 0.0,
73
+ "loss": 0.0052,
74
+ "step": 700
75
  },
76
  {
77
  "epoch": 5.0,
78
+ "eval_f1": 0.8956521739130435,
79
+ "eval_loss": 0.5154075622558594,
80
+ "eval_runtime": 8.6086,
81
+ "eval_samples_per_second": 27.879,
82
+ "eval_steps_per_second": 3.485,
83
+ "step": 700
84
  },
85
  {
86
  "epoch": 5.0,
87
+ "step": 700,
88
  "total_flos": 1473421910016000.0,
89
+ "train_loss": 0.17726608804294042,
90
+ "train_runtime": 611.8323,
91
+ "train_samples_per_second": 9.153,
92
+ "train_steps_per_second": 1.144
93
  }
94
  ],
95
+ "max_steps": 700,
96
  "num_train_epochs": 5,
97
  "total_flos": 1473421910016000.0,
98
  "trial_name": null,