amanvip2 commited on
Commit
b21926b
1 Parent(s): b88f8e1

Model save

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 2.0,
3
  "eval_accuracy": 0.8987341772151899,
4
  "eval_loss": 0.3074355721473694,
5
  "eval_runtime": 3.6489,
6
  "eval_samples_per_second": 64.952,
7
  "eval_steps_per_second": 8.222,
8
- "total_flos": 1.955915347965788e+17,
9
- "train_loss": 0.6030750751495362,
10
- "train_runtime": 187.2986,
11
- "train_samples_per_second": 13.476,
12
- "train_steps_per_second": 0.427
13
  }
 
1
  {
2
+ "epoch": 50.0,
3
  "eval_accuracy": 0.8987341772151899,
4
  "eval_loss": 0.3074355721473694,
5
  "eval_runtime": 3.6489,
6
  "eval_samples_per_second": 64.952,
7
  "eval_steps_per_second": 8.222,
8
+ "total_flos": 4.88978836991447e+18,
9
+ "train_loss": 0.33084768676757814,
10
+ "train_runtime": 1516.8774,
11
+ "train_samples_per_second": 41.599,
12
+ "train_steps_per_second": 1.318
13
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cac0bee8af0a46cf4b0b156fdc1237b3b1f5ab254d318045d0367f9f19e357c
3
  size 343272234
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49998377d5c0f5f5af433d325d06530c50543db0a81e542466e2fdd5d946fce0
3
  size 343272234
runs/May30_19-41-36_6edc4ca7637b/events.out.tfevents.1717098099.6edc4ca7637b.752.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8ae1b392ddcaeefbfbfe5d1a337603fa939db4849ffd1e2ff246059ec424a01
3
+ size 4083
runs/May30_19-42-37_6edc4ca7637b/events.out.tfevents.1717098159.6edc4ca7637b.752.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:438c73e40fddfc4c6fb04a853102d8c6e075dad6eae1eb6075fc1b8b7273f4b7
3
+ size 9135
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "total_flos": 1.955915347965788e+17,
4
- "train_loss": 0.6030750751495362,
5
- "train_runtime": 187.2986,
6
- "train_samples_per_second": 13.476,
7
- "train_steps_per_second": 0.427
8
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "total_flos": 4.88978836991447e+18,
4
+ "train_loss": 0.33084768676757814,
5
+ "train_runtime": 1516.8774,
6
+ "train_samples_per_second": 41.599,
7
+ "train_steps_per_second": 1.318
8
  }
trainer_state.json CHANGED
@@ -1,153 +1,363 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 2.0,
5
- "global_step": 80,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.25,
12
- "eval_accuracy": 0.6455696202531646,
13
- "eval_loss": 0.02083124729651439,
14
- "step": 10,
15
- "train_accuracy": 0.6513470681458003,
16
- "train_loss": 0.02266904281927553
17
  },
18
  {
19
- "epoch": 0.25,
20
- "eval_accuracy": 0.6455696202531646,
21
- "eval_loss": 0.02083124729651439,
22
- "step": 10,
23
- "train_accuracy": 0.6513470681458003,
24
- "train_loss": 0.02266904281927553
25
  },
26
  {
27
- "epoch": 0.5,
28
- "eval_accuracy": 0.7563291139240507,
29
- "eval_loss": 0.01929138223581676,
30
- "step": 20,
31
- "train_accuracy": 0.7234548335974643,
32
- "train_loss": 0.02028798799601674
33
  },
34
  {
35
- "epoch": 0.5,
36
- "eval_accuracy": 0.7563291139240507,
37
- "eval_loss": 0.01929138223581676,
38
- "step": 20,
39
- "train_accuracy": 0.7234548335974643,
40
- "train_loss": 0.02028798799601674
41
  },
42
  {
43
- "epoch": 0.75,
44
- "eval_accuracy": 0.6993670886075949,
45
- "eval_loss": 0.016825428114661686,
46
- "step": 30,
47
- "train_accuracy": 0.7076069730586371,
48
- "train_loss": 0.019086241485955408
49
- },
50
- {
51
- "epoch": 0.75,
52
- "eval_accuracy": 0.6993670886075949,
53
- "eval_loss": 0.016825428114661686,
54
- "step": 30,
55
- "train_accuracy": 0.7076069730586371,
56
- "train_loss": 0.019086241485955408
57
- },
58
- {
59
- "epoch": 1.0,
60
- "eval_accuracy": 0.759493670886076,
61
- "eval_loss": 0.016614416166196896,
62
- "step": 40,
63
- "train_accuracy": 0.7282091917591125,
64
- "train_loss": 0.018539198179819315
65
- },
66
- {
67
- "epoch": 1.0,
68
- "eval_accuracy": 0.759493670886076,
69
- "eval_loss": 0.016614416166196896,
70
- "step": 40,
71
- "train_accuracy": 0.7282091917591125,
72
- "train_loss": 0.018539198179819315
73
- },
74
- {
75
- "epoch": 1.25,
76
- "eval_accuracy": 0.879746835443038,
77
- "eval_loss": 0.012054138545748553,
78
- "step": 50,
79
- "train_accuracy": 0.7955625990491284,
80
- "train_loss": 0.015616062302408052
81
- },
82
- {
83
- "epoch": 1.25,
84
- "eval_accuracy": 0.879746835443038,
85
- "eval_loss": 0.012054138545748553,
86
- "step": 50,
87
- "train_accuracy": 0.7955625990491284,
88
- "train_loss": 0.015616062302408052
89
- },
90
- {
91
- "epoch": 1.5,
92
- "eval_accuracy": 0.8639240506329114,
93
- "eval_loss": 0.01136840549828131,
94
- "step": 60,
95
- "train_accuracy": 0.7963549920760697,
96
- "train_loss": 0.015155698980091113
97
- },
98
- {
99
- "epoch": 1.5,
100
- "eval_accuracy": 0.8639240506329114,
101
- "eval_loss": 0.01136840549828131,
102
- "step": 60,
103
- "train_accuracy": 0.7963549920760697,
104
- "train_loss": 0.015155698980091113
105
- },
106
- {
107
- "epoch": 1.75,
108
- "eval_accuracy": 0.8670886075949367,
109
- "eval_loss": 0.01149832556330705,
110
- "step": 70,
111
- "train_accuracy": 0.786053882725832,
112
- "train_loss": 0.015023683122523047
113
- },
114
- {
115
- "epoch": 1.75,
116
- "eval_accuracy": 0.8670886075949367,
117
- "eval_loss": 0.01149832556330705,
118
- "step": 70,
119
- "train_accuracy": 0.786053882725832,
120
- "train_loss": 0.015023683122523047
121
- },
122
- {
123
- "epoch": 2.0,
124
- "eval_accuracy": 0.879746835443038,
125
- "eval_loss": 0.011085053316400022,
126
- "step": 80,
127
- "train_accuracy": 0.8288431061806656,
128
- "train_loss": 0.01403916791293965
129
- },
130
- {
131
- "epoch": 2.0,
132
- "eval_accuracy": 0.879746835443038,
133
- "eval_loss": 0.011085053316400022,
134
- "step": 80,
135
- "train_accuracy": 0.8288431061806656,
136
- "train_loss": 0.01403916791293965
137
- },
138
- {
139
- "epoch": 2.0,
140
- "step": 80,
141
- "total_flos": 1.955915347965788e+17,
142
- "train_loss": 0.6030750751495362,
143
- "train_runtime": 187.2986,
144
- "train_samples_per_second": 13.476,
145
- "train_steps_per_second": 0.427
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
146
  }
147
  ],
148
- "max_steps": 80,
149
- "num_train_epochs": 2,
150
- "total_flos": 1.955915347965788e+17,
151
  "trial_name": null,
152
  "trial_params": null
153
  }
 
1
  {
2
+ "best_metric": 0.21378879249095917,
3
+ "best_model_checkpoint": "finetuned-breast_cancer_images/checkpoint-1000",
4
+ "epoch": 50.0,
5
+ "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 2.5,
12
+ "eval_accuracy": 0.8924050632911392,
13
+ "eval_loss": 0.010495646656314028,
14
+ "step": 100,
15
+ "train_accuracy": 0.7979397781299524,
16
+ "train_loss": 0.015081295120734988
17
  },
18
  {
19
+ "epoch": 2.5,
20
+ "eval_accuracy": 0.8924050632911392,
21
+ "eval_loss": 0.010495646656314028,
22
+ "step": 100,
23
+ "train_accuracy": 0.7979397781299524,
24
+ "train_loss": 0.015081295120734988
25
  },
26
  {
27
+ "epoch": 5.0,
28
+ "eval_accuracy": 0.8481012658227848,
29
+ "eval_loss": 0.012960963847139214,
30
+ "step": 200,
31
+ "train_accuracy": 0.7852614896988906,
32
+ "train_loss": 0.015557340427453846
33
  },
34
  {
35
+ "epoch": 5.0,
36
+ "eval_accuracy": 0.8481012658227848,
37
+ "eval_loss": 0.012960963847139214,
38
+ "step": 200,
39
+ "train_accuracy": 0.7852614896988906,
40
+ "train_loss": 0.015557340427453846
41
  },
42
  {
43
+ "epoch": 7.5,
44
+ "eval_accuracy": 0.8892405063291139,
45
+ "eval_loss": 0.010276811881155907,
46
+ "step": 300,
47
+ "train_accuracy": 0.820919175911252,
48
+ "train_loss": 0.013669456005474277
49
+ },
50
+ {
51
+ "epoch": 7.5,
52
+ "eval_accuracy": 0.8892405063291139,
53
+ "eval_loss": 0.010276811881155907,
54
+ "step": 300,
55
+ "train_accuracy": 0.820919175911252,
56
+ "train_loss": 0.013669456005474277
57
+ },
58
+ {
59
+ "epoch": 10.0,
60
+ "eval_accuracy": 0.9050632911392406,
61
+ "eval_loss": 0.008862663909227034,
62
+ "step": 400,
63
+ "train_accuracy": 0.820919175911252,
64
+ "train_loss": 0.012985682336350817
65
+ },
66
+ {
67
+ "epoch": 10.0,
68
+ "eval_accuracy": 0.9050632911392406,
69
+ "eval_loss": 0.008862663909227034,
70
+ "step": 400,
71
+ "train_accuracy": 0.820919175911252,
72
+ "train_loss": 0.012985682336350817
73
+ },
74
+ {
75
+ "epoch": 12.5,
76
+ "eval_accuracy": 0.9050632911392406,
77
+ "eval_loss": 0.008780632840021502,
78
+ "step": 500,
79
+ "train_accuracy": 0.8549920760697306,
80
+ "train_loss": 0.011721825129728877
81
+ },
82
+ {
83
+ "epoch": 12.5,
84
+ "eval_accuracy": 0.9050632911392406,
85
+ "eval_loss": 0.008780632840021502,
86
+ "step": 500,
87
+ "train_accuracy": 0.8549920760697306,
88
+ "train_loss": 0.011721825129728877
89
+ },
90
+ {
91
+ "epoch": 15.0,
92
+ "eval_accuracy": 0.8955696202531646,
93
+ "eval_loss": 0.011701402384080465,
94
+ "step": 600,
95
+ "train_accuracy": 0.8359746434231379,
96
+ "train_loss": 0.012715691998719036
97
+ },
98
+ {
99
+ "epoch": 15.0,
100
+ "eval_accuracy": 0.8955696202531646,
101
+ "eval_loss": 0.011701402384080465,
102
+ "step": 600,
103
+ "train_accuracy": 0.8359746434231379,
104
+ "train_loss": 0.012715691998719036
105
+ },
106
+ {
107
+ "epoch": 17.5,
108
+ "eval_accuracy": 0.9240506329113924,
109
+ "eval_loss": 0.008154087051560607,
110
+ "step": 700,
111
+ "train_accuracy": 0.8692551505546752,
112
+ "train_loss": 0.009956101531224847
113
+ },
114
+ {
115
+ "epoch": 17.5,
116
+ "eval_accuracy": 0.9240506329113924,
117
+ "eval_loss": 0.008154087051560607,
118
+ "step": 700,
119
+ "train_accuracy": 0.8692551505546752,
120
+ "train_loss": 0.009956101531224847
121
+ },
122
+ {
123
+ "epoch": 20.0,
124
+ "eval_accuracy": 0.9367088607594937,
125
+ "eval_loss": 0.007326934451260899,
126
+ "step": 800,
127
+ "train_accuracy": 0.8692551505546752,
128
+ "train_loss": 0.010289413544530914
129
+ },
130
+ {
131
+ "epoch": 20.0,
132
+ "eval_accuracy": 0.9367088607594937,
133
+ "eval_loss": 0.007326934451260899,
134
+ "step": 800,
135
+ "train_accuracy": 0.8692551505546752,
136
+ "train_loss": 0.010289413544530914
137
+ },
138
+ {
139
+ "epoch": 22.5,
140
+ "eval_accuracy": 0.9208860759493671,
141
+ "eval_loss": 0.00792535276541227,
142
+ "step": 900,
143
+ "train_accuracy": 0.8518225039619651,
144
+ "train_loss": 0.010583898344810716
145
+ },
146
+ {
147
+ "epoch": 22.5,
148
+ "eval_accuracy": 0.9208860759493671,
149
+ "eval_loss": 0.00792535276541227,
150
+ "step": 900,
151
+ "train_accuracy": 0.8518225039619651,
152
+ "train_loss": 0.010583898344810716
153
+ },
154
+ {
155
+ "epoch": 25.0,
156
+ "eval_accuracy": 0.9367088607594937,
157
+ "eval_loss": 0.006696073515222797,
158
+ "step": 1000,
159
+ "train_accuracy": 0.8716323296354992,
160
+ "train_loss": 0.00945120326076559
161
+ },
162
+ {
163
+ "epoch": 25.0,
164
+ "eval_accuracy": 0.9367088607594937,
165
+ "eval_loss": 0.006696073515222797,
166
+ "step": 1000,
167
+ "train_accuracy": 0.8716323296354992,
168
+ "train_loss": 0.00945120326076559
169
+ },
170
+ {
171
+ "epoch": 25.0,
172
+ "eval_accuracy": 0.9367088607594937,
173
+ "eval_loss": 0.21378879249095917,
174
+ "eval_runtime": 3.47,
175
+ "eval_samples_per_second": 91.067,
176
+ "eval_steps_per_second": 2.882,
177
+ "step": 1000
178
+ },
179
+ {
180
+ "epoch": 27.5,
181
+ "eval_accuracy": 0.9493670886075949,
182
+ "eval_loss": 0.006863981844928068,
183
+ "step": 1100,
184
+ "train_accuracy": 0.9049128367670365,
185
+ "train_loss": 0.008072348769087044
186
+ },
187
+ {
188
+ "epoch": 27.5,
189
+ "eval_accuracy": 0.9493670886075949,
190
+ "eval_loss": 0.006863981844928068,
191
+ "step": 1100,
192
+ "train_accuracy": 0.9049128367670365,
193
+ "train_loss": 0.008072348769087044
194
+ },
195
+ {
196
+ "epoch": 30.0,
197
+ "eval_accuracy": 0.9493670886075949,
198
+ "eval_loss": 0.007717294818898545,
199
+ "step": 1200,
200
+ "train_accuracy": 0.8763866877971473,
201
+ "train_loss": 0.008911726414779476
202
+ },
203
+ {
204
+ "epoch": 30.0,
205
+ "eval_accuracy": 0.9493670886075949,
206
+ "eval_loss": 0.007717294818898545,
207
+ "step": 1200,
208
+ "train_accuracy": 0.8763866877971473,
209
+ "train_loss": 0.008911726414779476
210
+ },
211
+ {
212
+ "epoch": 32.5,
213
+ "eval_accuracy": 0.9430379746835443,
214
+ "eval_loss": 0.007378749879477899,
215
+ "step": 1300,
216
+ "train_accuracy": 0.8985736925515055,
217
+ "train_loss": 0.007801188312459105
218
+ },
219
+ {
220
+ "epoch": 32.5,
221
+ "eval_accuracy": 0.9430379746835443,
222
+ "eval_loss": 0.007378749879477899,
223
+ "step": 1300,
224
+ "train_accuracy": 0.8985736925515055,
225
+ "train_loss": 0.007801188312459105
226
+ },
227
+ {
228
+ "epoch": 35.0,
229
+ "eval_accuracy": 0.9462025316455697,
230
+ "eval_loss": 0.008579130585104981,
231
+ "step": 1400,
232
+ "train_accuracy": 0.884310618066561,
233
+ "train_loss": 0.00868706993770486
234
+ },
235
+ {
236
+ "epoch": 35.0,
237
+ "eval_accuracy": 0.9462025316455697,
238
+ "eval_loss": 0.008579130585104981,
239
+ "step": 1400,
240
+ "train_accuracy": 0.884310618066561,
241
+ "train_loss": 0.00868706993770486
242
+ },
243
+ {
244
+ "epoch": 37.5,
245
+ "eval_accuracy": 0.9430379746835443,
246
+ "eval_loss": 0.008369221175207367,
247
+ "step": 1500,
248
+ "train_accuracy": 0.8882725832012678,
249
+ "train_loss": 0.007982963917514223
250
+ },
251
+ {
252
+ "epoch": 37.5,
253
+ "eval_accuracy": 0.9430379746835443,
254
+ "eval_loss": 0.008369221175207367,
255
+ "step": 1500,
256
+ "train_accuracy": 0.8882725832012678,
257
+ "train_loss": 0.007982963917514223
258
+ },
259
+ {
260
+ "epoch": 40.0,
261
+ "eval_accuracy": 0.9493670886075949,
262
+ "eval_loss": 0.007007662448560512,
263
+ "step": 1600,
264
+ "train_accuracy": 0.8874801901743264,
265
+ "train_loss": 0.00816094992230698
266
+ },
267
+ {
268
+ "epoch": 40.0,
269
+ "eval_accuracy": 0.9493670886075949,
270
+ "eval_loss": 0.007007662448560512,
271
+ "step": 1600,
272
+ "train_accuracy": 0.8874801901743264,
273
+ "train_loss": 0.00816094992230698
274
+ },
275
+ {
276
+ "epoch": 42.5,
277
+ "eval_accuracy": 0.939873417721519,
278
+ "eval_loss": 0.009104668280652052,
279
+ "step": 1700,
280
+ "train_accuracy": 0.893026941362916,
281
+ "train_loss": 0.0076013513251832095
282
+ },
283
+ {
284
+ "epoch": 42.5,
285
+ "eval_accuracy": 0.939873417721519,
286
+ "eval_loss": 0.009104668280652052,
287
+ "step": 1700,
288
+ "train_accuracy": 0.893026941362916,
289
+ "train_loss": 0.0076013513251832095
290
+ },
291
+ {
292
+ "epoch": 45.0,
293
+ "eval_accuracy": 0.9462025316455697,
294
+ "eval_loss": 0.009510103501143712,
295
+ "step": 1800,
296
+ "train_accuracy": 0.9009508716323297,
297
+ "train_loss": 0.007748251264286117
298
+ },
299
+ {
300
+ "epoch": 45.0,
301
+ "eval_accuracy": 0.9462025316455697,
302
+ "eval_loss": 0.009510103501143712,
303
+ "step": 1800,
304
+ "train_accuracy": 0.9009508716323297,
305
+ "train_loss": 0.007748251264286117
306
+ },
307
+ {
308
+ "epoch": 47.5,
309
+ "eval_accuracy": 0.9525316455696202,
310
+ "eval_loss": 0.008035543746067375,
311
+ "step": 1900,
312
+ "train_accuracy": 0.9136291600633915,
313
+ "train_loss": 0.006531332231314171
314
+ },
315
+ {
316
+ "epoch": 47.5,
317
+ "eval_accuracy": 0.9525316455696202,
318
+ "eval_loss": 0.008035543746067375,
319
+ "step": 1900,
320
+ "train_accuracy": 0.9136291600633915,
321
+ "train_loss": 0.006531332231314171
322
+ },
323
+ {
324
+ "epoch": 50.0,
325
+ "eval_accuracy": 0.9525316455696202,
326
+ "eval_loss": 0.007914679066006895,
327
+ "step": 2000,
328
+ "train_accuracy": 0.9263074484944532,
329
+ "train_loss": 0.006018087188174532
330
+ },
331
+ {
332
+ "epoch": 50.0,
333
+ "eval_accuracy": 0.9525316455696202,
334
+ "eval_loss": 0.007914679066006895,
335
+ "step": 2000,
336
+ "train_accuracy": 0.9263074484944532,
337
+ "train_loss": 0.006018087188174532
338
+ },
339
+ {
340
+ "epoch": 50.0,
341
+ "eval_accuracy": 0.9525316455696202,
342
+ "eval_loss": 0.2529405653476715,
343
+ "eval_runtime": 3.4414,
344
+ "eval_samples_per_second": 91.824,
345
+ "eval_steps_per_second": 2.906,
346
+ "step": 2000
347
+ },
348
+ {
349
+ "epoch": 50.0,
350
+ "step": 2000,
351
+ "total_flos": 4.88978836991447e+18,
352
+ "train_loss": 0.33084768676757814,
353
+ "train_runtime": 1516.8774,
354
+ "train_samples_per_second": 41.599,
355
+ "train_steps_per_second": 1.318
356
  }
357
  ],
358
+ "max_steps": 2000,
359
+ "num_train_epochs": 50,
360
+ "total_flos": 4.88978836991447e+18,
361
  "trial_name": null,
362
  "trial_params": null
363
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f50f8725744fee2d7ed7f926ac8393ac6e100a44aa311df5a83428e418ab1313
3
  size 4408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae9fe06bfc25014d97d851b72c94a69c9588049a36c83c2c6dca94d3e6e63e51
3
  size 4408