mp-02 committed on
Commit
0bc6d99
·
1 Parent(s): 63690ef

End of training

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.8104042259990814,
4
- "eval_f1": 0.8313368471490178,
5
- "eval_loss": 0.5929840803146362,
6
- "eval_precision": 0.7980680772769089,
7
- "eval_recall": 0.8675,
8
- "eval_runtime": 2.4572,
9
  "eval_samples": 54,
10
- "eval_samples_per_second": 21.976,
11
- "eval_steps_per_second": 2.442,
12
  "predict_accuracy": 0.8218373936014088,
13
  "predict_f1": 0.9038133181559477,
14
  "predict_loss": 0.6888472437858582,
@@ -17,9 +17,9 @@
17
  "predict_runtime": 2.0596,
18
  "predict_samples_per_second": 8.74,
19
  "predict_steps_per_second": 0.971,
20
- "train_loss": 0.7810765075683593,
21
- "train_runtime": 94.7164,
22
  "train_samples": 150,
23
- "train_samples_per_second": 15.837,
24
- "train_steps_per_second": 1.584
25
  }
 
1
  {
2
+ "epoch": 26.67,
3
+ "eval_accuracy": 0.8414101975195223,
4
+ "eval_f1": 0.8868156150257795,
5
+ "eval_loss": 0.6016380190849304,
6
+ "eval_precision": 0.8712011577424024,
7
+ "eval_recall": 0.903,
8
+ "eval_runtime": 3.9126,
9
  "eval_samples": 54,
10
+ "eval_samples_per_second": 13.801,
11
+ "eval_steps_per_second": 1.533,
12
  "predict_accuracy": 0.8218373936014088,
13
  "predict_f1": 0.9038133181559477,
14
  "predict_loss": 0.6888472437858582,
 
17
  "predict_runtime": 2.0596,
18
  "predict_samples_per_second": 8.74,
19
  "predict_steps_per_second": 0.971,
20
+ "train_loss": 0.3642783355712891,
21
+ "train_runtime": 422.1629,
22
  "train_samples": 150,
23
+ "train_samples_per_second": 9.475,
24
+ "train_steps_per_second": 0.948
25
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.8104042259990814,
4
- "eval_f1": 0.8313368471490178,
5
- "eval_loss": 0.5929840803146362,
6
- "eval_precision": 0.7980680772769089,
7
- "eval_recall": 0.8675,
8
- "eval_runtime": 2.4572,
9
  "eval_samples": 54,
10
- "eval_samples_per_second": 21.976,
11
- "eval_steps_per_second": 2.442
12
  }
 
1
  {
2
+ "epoch": 26.67,
3
+ "eval_accuracy": 0.8414101975195223,
4
+ "eval_f1": 0.8868156150257795,
5
+ "eval_loss": 0.6016380190849304,
6
+ "eval_precision": 0.8712011577424024,
7
+ "eval_recall": 0.903,
8
+ "eval_runtime": 3.9126,
9
  "eval_samples": 54,
10
+ "eval_samples_per_second": 13.801,
11
+ "eval_steps_per_second": 1.533
12
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:841506f6c6c0a194bcb07157467ddcf167f6909db9a6af7260982b8d5abc6e08
3
  size 501420883
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8356f85a16aec70deef67c107e63fd773b89ce3c9d102cc38b7811b85a8d9f28
3
  size 501420883
runs/Aug24_18-22-33_bernini/1724516563.6851988/events.out.tfevents.1724516563.bernini.17841.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e8940cb1bbb04e933bcbd75e44e4cc408caedcd13138e70fa304b1bb45082d
3
+ size 4671
runs/Aug24_18-22-33_bernini/events.out.tfevents.1724516563.bernini.17841.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d0a4d477821d2c2b62e7d108caec6511c646418d088d0de0f0489130766f8f
3
+ size 4088
runs/Aug24_18-32-17_bernini/1724517150.2935843/events.out.tfevents.1724517150.bernini.31282.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:973e343088863c70872623627f05d8a41950c931fb81980efcb6a91b8a765e5c
3
+ size 4671
runs/Aug24_18-32-17_bernini/events.out.tfevents.1724517150.bernini.31282.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b1e582bc38077dcfc75784c4d8d42dd47878f91fc711614faf3c888bf8d959
3
+ size 4088
runs/Aug24_18-33-02_bernini/1724517195.431775/events.out.tfevents.1724517195.bernini.32539.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b52a187b8f6cbaded77baa92e421ad8931132e5a273f12be0b22f7a476851f1
3
+ size 4671
runs/Aug24_18-33-02_bernini/events.out.tfevents.1724517195.bernini.32539.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6444f0a2b4e3bbc6adf7365c5a20f7fac948204dd9ed7c062a949658f87c2b3c
3
+ size 11949
runs/Aug24_18-33-02_bernini/events.out.tfevents.1724517626.bernini.32539.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f8bb50b51aa38df749470f03a61b8dcd8867a35578004c2577d86726c3b170
3
+ size 512
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "train_loss": 0.7810765075683593,
4
- "train_runtime": 94.7164,
5
  "train_samples": 150,
6
- "train_samples_per_second": 15.837,
7
- "train_steps_per_second": 1.584
8
  }
 
1
  {
2
+ "epoch": 26.67,
3
+ "train_loss": 0.3642783355712891,
4
+ "train_runtime": 422.1629,
5
  "train_samples": 150,
6
+ "train_samples_per_second": 9.475,
7
+ "train_steps_per_second": 0.948
8
  }
trainer_state.json CHANGED
@@ -1,97 +1,217 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
- "global_step": 150,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.67,
12
- "eval_accuracy": 0.6559485530546624,
13
- "eval_f1": 0.48850983179341384,
14
- "eval_loss": 1.2209023237228394,
15
- "eval_precision": 0.46420531292210715,
16
- "eval_recall": 0.5155,
17
- "eval_runtime": 2.3635,
18
- "eval_samples_per_second": 22.848,
19
- "eval_steps_per_second": 2.539,
20
  "step": 25
21
  },
22
  {
23
  "epoch": 3.33,
24
- "eval_accuracy": 0.7619430408819476,
25
- "eval_f1": 0.7535809662539452,
26
- "eval_loss": 0.8171831965446472,
27
- "eval_precision": 0.732420953279849,
28
- "eval_recall": 0.776,
29
- "eval_runtime": 2.3634,
30
- "eval_samples_per_second": 22.849,
31
- "eval_steps_per_second": 2.539,
32
  "step": 50
33
  },
34
  {
35
  "epoch": 5.0,
36
- "eval_accuracy": 0.8125861276986679,
37
- "eval_f1": 0.8145823273780782,
38
- "eval_loss": 0.6125288605690002,
39
- "eval_precision": 0.7875816993464052,
40
- "eval_recall": 0.8435,
41
- "eval_runtime": 2.3662,
42
- "eval_samples_per_second": 22.821,
43
- "eval_steps_per_second": 2.536,
44
  "step": 75
45
  },
46
  {
47
  "epoch": 6.67,
48
- "eval_accuracy": 0.8107487367937529,
49
- "eval_f1": 0.8347784200385356,
50
- "eval_loss": 0.5983520150184631,
51
- "eval_precision": 0.8052973977695167,
52
- "eval_recall": 0.8665,
53
- "eval_runtime": 2.4636,
54
- "eval_samples_per_second": 21.92,
55
- "eval_steps_per_second": 2.436,
56
  "step": 100
57
  },
58
  {
59
  "epoch": 8.33,
60
- "eval_accuracy": 0.8216582452916859,
61
- "eval_f1": 0.8363723608445298,
62
- "eval_loss": 0.5673876404762268,
63
- "eval_precision": 0.8039667896678967,
64
- "eval_recall": 0.8715,
65
- "eval_runtime": 2.3684,
66
- "eval_samples_per_second": 22.8,
67
- "eval_steps_per_second": 2.533,
68
  "step": 125
69
  },
70
  {
71
  "epoch": 10.0,
72
- "eval_accuracy": 0.8104042259990814,
73
- "eval_f1": 0.8313368471490178,
74
- "eval_loss": 0.5929840803146362,
75
- "eval_precision": 0.7980680772769089,
76
- "eval_recall": 0.8675,
77
- "eval_runtime": 2.4505,
78
- "eval_samples_per_second": 22.036,
79
- "eval_steps_per_second": 2.448,
80
  "step": 150
81
  },
82
  {
83
- "epoch": 10.0,
84
- "step": 150,
85
- "total_flos": 395408014848000.0,
86
- "train_loss": 0.7810765075683593,
87
- "train_runtime": 94.7164,
88
- "train_samples_per_second": 15.837,
89
- "train_steps_per_second": 1.584
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  }
91
  ],
92
- "max_steps": 150,
93
- "num_train_epochs": 10,
94
- "total_flos": 395408014848000.0,
95
  "trial_name": null,
96
  "trial_params": null
97
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 26.666666666666668,
5
+ "global_step": 400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.67,
12
+ "eval_accuracy": 0.6659393661001378,
13
+ "eval_f1": 0.5035663338088445,
14
+ "eval_loss": 1.1944581270217896,
15
+ "eval_precision": 0.4800543970988214,
16
+ "eval_recall": 0.5295,
17
+ "eval_runtime": 3.6881,
18
+ "eval_samples_per_second": 14.641,
19
+ "eval_steps_per_second": 1.627,
20
  "step": 25
21
  },
22
  {
23
  "epoch": 3.33,
24
+ "eval_accuracy": 0.7687184198438217,
25
+ "eval_f1": 0.7759615384615385,
26
+ "eval_loss": 0.7770130038261414,
27
+ "eval_precision": 0.7472222222222222,
28
+ "eval_recall": 0.807,
29
+ "eval_runtime": 3.715,
30
+ "eval_samples_per_second": 14.536,
31
+ "eval_steps_per_second": 1.615,
32
  "step": 50
33
  },
34
  {
35
  "epoch": 5.0,
36
+ "eval_accuracy": 0.8118971061093248,
37
+ "eval_f1": 0.8231029482841953,
38
+ "eval_loss": 0.5989910364151001,
39
+ "eval_precision": 0.7965388213283442,
40
+ "eval_recall": 0.8515,
41
+ "eval_runtime": 3.6727,
42
+ "eval_samples_per_second": 14.703,
43
+ "eval_steps_per_second": 1.634,
44
  "step": 75
45
  },
46
  {
47
  "epoch": 6.67,
48
+ "eval_accuracy": 0.7702112999540652,
49
+ "eval_f1": 0.8409471418320977,
50
+ "eval_loss": 0.6813620924949646,
51
+ "eval_precision": 0.8060522696011004,
52
+ "eval_recall": 0.879,
53
+ "eval_runtime": 3.7496,
54
+ "eval_samples_per_second": 14.402,
55
+ "eval_steps_per_second": 1.6,
56
  "step": 100
57
  },
58
  {
59
  "epoch": 8.33,
60
+ "eval_accuracy": 0.8316490583371612,
61
+ "eval_f1": 0.8467469879518073,
62
+ "eval_loss": 0.5391940474510193,
63
+ "eval_precision": 0.8172093023255814,
64
+ "eval_recall": 0.8785,
65
+ "eval_runtime": 3.7027,
66
+ "eval_samples_per_second": 14.584,
67
+ "eval_steps_per_second": 1.62,
68
  "step": 125
69
  },
70
  {
71
  "epoch": 10.0,
72
+ "eval_accuracy": 0.811437758383096,
73
+ "eval_f1": 0.8603297769156159,
74
+ "eval_loss": 0.5438030362129211,
75
+ "eval_precision": 0.835216572504708,
76
+ "eval_recall": 0.887,
77
+ "eval_runtime": 3.7703,
78
+ "eval_samples_per_second": 14.322,
79
+ "eval_steps_per_second": 1.591,
80
  "step": 150
81
  },
82
  {
83
+ "epoch": 11.67,
84
+ "eval_accuracy": 0.838194763435921,
85
+ "eval_f1": 0.8752145133611179,
86
+ "eval_loss": 0.5429797172546387,
87
+ "eval_precision": 0.8585858585858586,
88
+ "eval_recall": 0.8925,
89
+ "eval_runtime": 3.7262,
90
+ "eval_samples_per_second": 14.492,
91
+ "eval_steps_per_second": 1.61,
92
+ "step": 175
93
+ },
94
+ {
95
+ "epoch": 13.33,
96
+ "eval_accuracy": 0.8257923748277446,
97
+ "eval_f1": 0.8691817736403724,
98
+ "eval_loss": 0.5896742939949036,
99
+ "eval_precision": 0.8520653218059558,
100
+ "eval_recall": 0.887,
101
+ "eval_runtime": 3.7744,
102
+ "eval_samples_per_second": 14.307,
103
+ "eval_steps_per_second": 1.59,
104
+ "step": 200
105
+ },
106
+ {
107
+ "epoch": 15.0,
108
+ "eval_accuracy": 0.8430179145613229,
109
+ "eval_f1": 0.8809756097560977,
110
+ "eval_loss": 0.5427059531211853,
111
+ "eval_precision": 0.86,
112
+ "eval_recall": 0.903,
113
+ "eval_runtime": 3.6854,
114
+ "eval_samples_per_second": 14.652,
115
+ "eval_steps_per_second": 1.628,
116
+ "step": 225
117
+ },
118
+ {
119
+ "epoch": 16.67,
120
+ "eval_accuracy": 0.8410656867248507,
121
+ "eval_f1": 0.8822512959763021,
122
+ "eval_loss": 0.5541779398918152,
123
+ "eval_precision": 0.871282301316431,
124
+ "eval_recall": 0.8935,
125
+ "eval_runtime": 3.7194,
126
+ "eval_samples_per_second": 14.518,
127
+ "eval_steps_per_second": 1.613,
128
+ "step": 250
129
+ },
130
+ {
131
+ "epoch": 18.33,
132
+ "eval_accuracy": 0.83210840606339,
133
+ "eval_f1": 0.8821515892420537,
134
+ "eval_loss": 0.6013592481613159,
135
+ "eval_precision": 0.8631578947368421,
136
+ "eval_recall": 0.902,
137
+ "eval_runtime": 3.7675,
138
+ "eval_samples_per_second": 14.333,
139
+ "eval_steps_per_second": 1.593,
140
+ "step": 275
141
+ },
142
+ {
143
+ "epoch": 20.0,
144
+ "eval_accuracy": 0.8365870463941204,
145
+ "eval_f1": 0.8843036109064112,
146
+ "eval_loss": 0.5971384644508362,
147
+ "eval_precision": 0.8691453404152584,
148
+ "eval_recall": 0.9,
149
+ "eval_runtime": 3.72,
150
+ "eval_samples_per_second": 14.516,
151
+ "eval_steps_per_second": 1.613,
152
+ "step": 300
153
+ },
154
+ {
155
+ "epoch": 21.67,
156
+ "eval_accuracy": 0.8313045475424896,
157
+ "eval_f1": 0.8891637803067788,
158
+ "eval_loss": 0.598324716091156,
159
+ "eval_precision": 0.8800195886385896,
160
+ "eval_recall": 0.8985,
161
+ "eval_runtime": 3.78,
162
+ "eval_samples_per_second": 14.286,
163
+ "eval_steps_per_second": 1.587,
164
+ "step": 325
165
+ },
166
+ {
167
+ "epoch": 23.33,
168
+ "eval_accuracy": 0.8414101975195223,
169
+ "eval_f1": 0.8964497041420119,
170
+ "eval_loss": 0.5867139101028442,
171
+ "eval_precision": 0.8842412451361867,
172
+ "eval_recall": 0.909,
173
+ "eval_runtime": 4.0235,
174
+ "eval_samples_per_second": 13.421,
175
+ "eval_steps_per_second": 1.491,
176
+ "step": 350
177
+ },
178
+ {
179
+ "epoch": 25.0,
180
+ "eval_accuracy": 0.8465778594395957,
181
+ "eval_f1": 0.8928835262250677,
182
+ "eval_loss": 0.5947966575622559,
183
+ "eval_precision": 0.8796700630761766,
184
+ "eval_recall": 0.9065,
185
+ "eval_runtime": 3.6989,
186
+ "eval_samples_per_second": 14.599,
187
+ "eval_steps_per_second": 1.622,
188
+ "step": 375
189
+ },
190
+ {
191
+ "epoch": 26.67,
192
+ "eval_accuracy": 0.8414101975195223,
193
+ "eval_f1": 0.8868156150257795,
194
+ "eval_loss": 0.6016380190849304,
195
+ "eval_precision": 0.8712011577424024,
196
+ "eval_recall": 0.903,
197
+ "eval_runtime": 3.6913,
198
+ "eval_samples_per_second": 14.629,
199
+ "eval_steps_per_second": 1.625,
200
+ "step": 400
201
+ },
202
+ {
203
+ "epoch": 26.67,
204
+ "step": 400,
205
+ "total_flos": 1054421372928000.0,
206
+ "train_loss": 0.3642783355712891,
207
+ "train_runtime": 422.1629,
208
+ "train_samples_per_second": 9.475,
209
+ "train_steps_per_second": 0.948
210
  }
211
  ],
212
+ "max_steps": 400,
213
+ "num_train_epochs": 27,
214
+ "total_flos": 1054421372928000.0,
215
  "trial_name": null,
216
  "trial_params": null
217
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67e671d048c6381947443975ece3fe1b7ffa48552b826dcbe8f9155c1dca716d
3
  size 2927
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8562d79844654a7b5375505088993c1664cd2a797de81729e592c18046e9651
3
  size 2927