synergyai-jaeung committed on
Commit
0aa4735
1 Parent(s): e141828

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
- "epoch": 12.0,
3
  "eval_AUC": 0.5,
4
- "eval_F1": 0.47572815533980584,
5
- "eval_Precision": 0.9074074074074074,
6
  "eval_Recall": 1.0,
7
- "eval_accuracy": 0.9074074074074074,
8
- "eval_loss": 0.3346473276615143,
9
- "eval_runtime": 5.474,
10
- "eval_samples_per_second": 59.189,
11
- "eval_steps_per_second": 3.836,
12
- "total_flos": 6.862690600268268e+17,
13
- "train_loss": 0.03526242822408676,
14
- "train_runtime": 251.233,
15
- "train_samples_per_second": 35.25,
16
- "train_steps_per_second": 2.245
17
  }
 
1
  {
2
+ "epoch": 15.0,
3
  "eval_AUC": 0.5,
4
+ "eval_F1": 0.47540983606557374,
5
+ "eval_Precision": 0.90625,
6
  "eval_Recall": 1.0,
7
+ "eval_accuracy": 0.90625,
8
+ "eval_loss": 0.33828961849212646,
9
+ "eval_runtime": 5.0159,
10
+ "eval_samples_per_second": 76.557,
11
+ "eval_steps_per_second": 4.785,
12
+ "total_flos": 1.0112704644704256e+18,
13
+ "train_loss": 0.06119063453240828,
14
+ "train_runtime": 257.3401,
15
+ "train_samples_per_second": 50.711,
16
+ "train_steps_per_second": 3.206
17
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 12.0,
3
  "eval_AUC": 0.5,
4
- "eval_F1": 0.47572815533980584,
5
- "eval_Precision": 0.9074074074074074,
6
  "eval_Recall": 1.0,
7
- "eval_accuracy": 0.9074074074074074,
8
- "eval_loss": 0.3346473276615143,
9
- "eval_runtime": 5.474,
10
- "eval_samples_per_second": 59.189,
11
- "eval_steps_per_second": 3.836
12
  }
 
1
  {
2
+ "epoch": 15.0,
3
  "eval_AUC": 0.5,
4
+ "eval_F1": 0.47540983606557374,
5
+ "eval_Precision": 0.90625,
6
  "eval_Recall": 1.0,
7
+ "eval_accuracy": 0.90625,
8
+ "eval_loss": 0.33828961849212646,
9
+ "eval_runtime": 5.0159,
10
+ "eval_samples_per_second": 76.557,
11
+ "eval_steps_per_second": 4.785
12
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:760373362287b69643cb264294c3cdca3c69105ed8734ed2b2cb181e5b3d2411
3
  size 343223968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4884df1de3f4f54ce6cdaeef73244807d3600eed0a76713c72478f0fb60cd851
3
  size 343223968
runs/May28_16-57-52_RTX3090/events.out.tfevents.1716883342.RTX3090.462376.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:845cd2569a3c1adfb6a17d0eb48ba0c95677eccc9c9fb4a0c5a2ec8f0b20a465
3
+ size 607
runs/May29_01-21-51_RTX3090/events.out.tfevents.1716913322.RTX3090.597255.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00bba5d4ad77fbd27f6c0ab08e3f7f63a5773ce2655780c8eaff95de30eb1ccb
3
+ size 5634
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 12.0,
3
- "total_flos": 6.862690600268268e+17,
4
- "train_loss": 0.03526242822408676,
5
- "train_runtime": 251.233,
6
- "train_samples_per_second": 35.25,
7
- "train_steps_per_second": 2.245
8
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "total_flos": 1.0112704644704256e+18,
4
+ "train_loss": 0.06119063453240828,
5
+ "train_runtime": 257.3401,
6
+ "train_samples_per_second": 50.711,
7
+ "train_steps_per_second": 3.206
8
  }
trainer_state.json CHANGED
@@ -1,197 +1,236 @@
1
  {
2
- "best_metric": 0.3346473276615143,
3
- "best_model_checkpoint": "google/vit-base-patch16-224-in21k_covid_19_ct_scans/checkpoint-47",
4
- "epoch": 12.0,
5
  "eval_steps": 500,
6
- "global_step": 564,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.02127659574468085,
13
- "grad_norm": 4.243431091308594,
14
- "learning_rate": 0.000199645390070922,
15
- "loss": 0.7767,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 1.0,
20
  "eval_AUC": 0.5,
21
- "eval_F1": 0.47572815533980584,
22
- "eval_Precision": 0.9074074074074074,
23
  "eval_Recall": 1.0,
24
- "eval_accuracy": 0.9074074074074074,
25
- "eval_loss": 0.3346473276615143,
26
- "eval_runtime": 5.5299,
27
- "eval_samples_per_second": 58.591,
28
- "eval_steps_per_second": 3.798,
29
- "step": 47
30
  },
31
  {
32
  "epoch": 2.0,
33
- "eval_AUC": 0.6204081632653061,
34
- "eval_F1": 0.5919028340080972,
35
- "eval_Precision": 0.9311594202898551,
36
- "eval_Recall": 0.8741496598639455,
37
- "eval_accuracy": 0.8271604938271605,
38
- "eval_loss": 0.5513330698013306,
39
- "eval_runtime": 5.5902,
40
- "eval_samples_per_second": 57.959,
41
- "eval_steps_per_second": 3.757,
42
- "step": 94
43
  },
44
  {
45
  "epoch": 3.0,
46
  "eval_AUC": 0.5,
47
- "eval_F1": 0.47572815533980584,
48
- "eval_Precision": 0.9074074074074074,
49
  "eval_Recall": 1.0,
50
- "eval_accuracy": 0.9074074074074074,
51
- "eval_loss": 0.4290040135383606,
52
- "eval_runtime": 5.491,
53
- "eval_samples_per_second": 59.005,
54
- "eval_steps_per_second": 3.824,
55
- "step": 141
56
  },
57
  {
58
  "epoch": 4.0,
59
- "eval_AUC": 0.5965986394557823,
60
- "eval_F1": 0.6365832614322692,
61
- "eval_Precision": 0.9240506329113924,
62
- "eval_Recall": 0.9931972789115646,
63
- "eval_accuracy": 0.9197530864197531,
64
- "eval_loss": 0.433300256729126,
65
- "eval_runtime": 5.3718,
66
- "eval_samples_per_second": 60.315,
67
- "eval_steps_per_second": 3.909,
68
- "step": 188
69
  },
70
  {
71
  "epoch": 5.0,
72
- "eval_AUC": 0.5897959183673469,
73
- "eval_F1": 0.618104667609618,
74
- "eval_Precision": 0.9230769230769231,
75
- "eval_Recall": 0.9795918367346939,
76
- "eval_accuracy": 0.9074074074074074,
77
- "eval_loss": 0.5040868520736694,
78
- "eval_runtime": 5.759,
79
- "eval_samples_per_second": 56.26,
80
- "eval_steps_per_second": 3.646,
81
- "step": 235
82
  },
83
  {
84
  "epoch": 6.0,
85
- "eval_AUC": 0.5948979591836735,
86
- "eval_F1": 0.6316786661614249,
87
- "eval_Precision": 0.9238095238095239,
88
- "eval_Recall": 0.9897959183673469,
89
- "eval_accuracy": 0.9166666666666666,
90
- "eval_loss": 0.4848092496395111,
91
- "eval_runtime": 13.7532,
92
- "eval_samples_per_second": 23.558,
93
- "eval_steps_per_second": 1.527,
94
- "step": 282
95
  },
96
  {
97
  "epoch": 7.0,
98
- "eval_AUC": 0.5965986394557823,
99
- "eval_F1": 0.6365832614322692,
100
- "eval_Precision": 0.9240506329113924,
101
- "eval_Recall": 0.9931972789115646,
102
- "eval_accuracy": 0.9197530864197531,
103
- "eval_loss": 0.48772257566452026,
104
- "eval_runtime": 5.5683,
105
- "eval_samples_per_second": 58.186,
106
- "eval_steps_per_second": 3.771,
107
- "step": 329
108
  },
109
  {
110
  "epoch": 8.0,
111
- "eval_AUC": 0.5965986394557823,
112
- "eval_F1": 0.6365832614322692,
113
- "eval_Precision": 0.9240506329113924,
114
- "eval_Recall": 0.9931972789115646,
115
- "eval_accuracy": 0.9197530864197531,
116
- "eval_loss": 0.49257075786590576,
117
- "eval_runtime": 5.2567,
118
- "eval_samples_per_second": 61.635,
119
- "eval_steps_per_second": 3.995,
120
- "step": 376
121
  },
122
  {
123
  "epoch": 9.0,
124
- "eval_AUC": 0.5965986394557823,
125
- "eval_F1": 0.6365832614322692,
126
- "eval_Precision": 0.9240506329113924,
127
- "eval_Recall": 0.9931972789115646,
128
- "eval_accuracy": 0.9197530864197531,
129
- "eval_loss": 0.49581947922706604,
130
- "eval_runtime": 5.6218,
131
- "eval_samples_per_second": 57.633,
132
- "eval_steps_per_second": 3.735,
133
- "step": 423
134
  },
135
  {
136
- "epoch": 10.0,
137
- "eval_AUC": 0.5965986394557823,
138
- "eval_F1": 0.6365832614322692,
139
- "eval_Precision": 0.9240506329113924,
140
- "eval_Recall": 0.9931972789115646,
141
- "eval_accuracy": 0.9197530864197531,
142
- "eval_loss": 0.4980551600456238,
143
- "eval_runtime": 5.5112,
144
- "eval_samples_per_second": 58.79,
145
- "eval_steps_per_second": 3.81,
146
- "step": 470
147
- },
148
- {
149
- "epoch": 10.638297872340425,
150
- "grad_norm": 0.012480547651648521,
151
- "learning_rate": 2.269503546099291e-05,
152
- "loss": 0.0381,
153
  "step": 500
154
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
155
  {
156
  "epoch": 11.0,
157
- "eval_AUC": 0.5965986394557823,
158
- "eval_F1": 0.6365832614322692,
159
- "eval_Precision": 0.9240506329113924,
160
- "eval_Recall": 0.9931972789115646,
161
- "eval_accuracy": 0.9197530864197531,
162
- "eval_loss": 0.4996081292629242,
163
- "eval_runtime": 5.5015,
164
- "eval_samples_per_second": 58.893,
165
- "eval_steps_per_second": 3.817,
166
- "step": 517
167
  },
168
  {
169
  "epoch": 12.0,
170
- "eval_AUC": 0.5965986394557823,
171
- "eval_F1": 0.6365832614322692,
172
- "eval_Precision": 0.9240506329113924,
173
- "eval_Recall": 0.9931972789115646,
174
- "eval_accuracy": 0.9197530864197531,
175
- "eval_loss": 0.5001835823059082,
176
- "eval_runtime": 5.5423,
177
- "eval_samples_per_second": 58.46,
178
- "eval_steps_per_second": 3.789,
179
- "step": 564
180
  },
181
  {
182
- "epoch": 12.0,
183
- "step": 564,
184
- "total_flos": 6.862690600268268e+17,
185
- "train_loss": 0.03526242822408676,
186
- "train_runtime": 251.233,
187
- "train_samples_per_second": 35.25,
188
- "train_steps_per_second": 2.245
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
189
  }
190
  ],
191
  "logging_steps": 500,
192
- "max_steps": 564,
193
  "num_input_tokens_seen": 0,
194
- "num_train_epochs": 12,
195
  "save_steps": 500,
196
  "stateful_callbacks": {
197
  "TrainerControl": {
@@ -205,7 +244,7 @@
205
  "attributes": {}
206
  }
207
  },
208
- "total_flos": 6.862690600268268e+17,
209
  "train_batch_size": 16,
210
  "trial_name": null,
211
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.33828961849212646,
3
+ "best_model_checkpoint": "google/vit-base-patch16-224-in21k_covid_19_ct_scans/checkpoint-55",
4
+ "epoch": 15.0,
5
  "eval_steps": 500,
6
+ "global_step": 825,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.01818181818181818,
13
+ "grad_norm": 3.793684244155884,
14
+ "learning_rate": 0.00019975757575757576,
15
+ "loss": 0.7218,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 1.0,
20
  "eval_AUC": 0.5,
21
+ "eval_F1": 0.47540983606557374,
22
+ "eval_Precision": 0.90625,
23
  "eval_Recall": 1.0,
24
+ "eval_accuracy": 0.90625,
25
+ "eval_loss": 0.33828961849212646,
26
+ "eval_runtime": 4.7492,
27
+ "eval_samples_per_second": 80.855,
28
+ "eval_steps_per_second": 5.053,
29
+ "step": 55
30
  },
31
  {
32
  "epoch": 2.0,
33
+ "eval_AUC": 0.5,
34
+ "eval_F1": 0.47540983606557374,
35
+ "eval_Precision": 0.90625,
36
+ "eval_Recall": 1.0,
37
+ "eval_accuracy": 0.90625,
38
+ "eval_loss": 0.382261723279953,
39
+ "eval_runtime": 4.831,
40
+ "eval_samples_per_second": 79.486,
41
+ "eval_steps_per_second": 4.968,
42
+ "step": 110
43
  },
44
  {
45
  "epoch": 3.0,
46
  "eval_AUC": 0.5,
47
+ "eval_F1": 0.47540983606557374,
48
+ "eval_Precision": 0.90625,
49
  "eval_Recall": 1.0,
50
+ "eval_accuracy": 0.90625,
51
+ "eval_loss": 0.3956604301929474,
52
+ "eval_runtime": 4.8897,
53
+ "eval_samples_per_second": 78.532,
54
+ "eval_steps_per_second": 4.908,
55
+ "step": 165
56
  },
57
  {
58
  "epoch": 4.0,
59
+ "eval_AUC": 0.5,
60
+ "eval_F1": 0.47540983606557374,
61
+ "eval_Precision": 0.90625,
62
+ "eval_Recall": 1.0,
63
+ "eval_accuracy": 0.90625,
64
+ "eval_loss": 0.44851580262184143,
65
+ "eval_runtime": 4.8632,
66
+ "eval_samples_per_second": 78.96,
67
+ "eval_steps_per_second": 4.935,
68
+ "step": 220
69
  },
70
  {
71
  "epoch": 5.0,
72
+ "eval_AUC": 0.4942528735632184,
73
+ "eval_F1": 0.4725274725274725,
74
+ "eval_Precision": 0.9052631578947369,
75
+ "eval_Recall": 0.9885057471264368,
76
+ "eval_accuracy": 0.8958333333333334,
77
+ "eval_loss": 0.4786018133163452,
78
+ "eval_runtime": 4.8854,
79
+ "eval_samples_per_second": 78.601,
80
+ "eval_steps_per_second": 4.913,
81
+ "step": 275
82
  },
83
  {
84
  "epoch": 6.0,
85
+ "eval_AUC": 0.49712643678160917,
86
+ "eval_F1": 0.473972602739726,
87
+ "eval_Precision": 0.9057591623036649,
88
+ "eval_Recall": 0.9942528735632183,
89
+ "eval_accuracy": 0.9010416666666666,
90
+ "eval_loss": 0.5316488146781921,
91
+ "eval_runtime": 5.3191,
92
+ "eval_samples_per_second": 72.193,
93
+ "eval_steps_per_second": 4.512,
94
+ "step": 330
95
  },
96
  {
97
  "epoch": 7.0,
98
+ "eval_AUC": 0.49712643678160917,
99
+ "eval_F1": 0.473972602739726,
100
+ "eval_Precision": 0.9057591623036649,
101
+ "eval_Recall": 0.9942528735632183,
102
+ "eval_accuracy": 0.9010416666666666,
103
+ "eval_loss": 0.553883969783783,
104
+ "eval_runtime": 4.8592,
105
+ "eval_samples_per_second": 79.026,
106
+ "eval_steps_per_second": 4.939,
107
+ "step": 385
108
  },
109
  {
110
  "epoch": 8.0,
111
+ "eval_AUC": 0.49712643678160917,
112
+ "eval_F1": 0.473972602739726,
113
+ "eval_Precision": 0.9057591623036649,
114
+ "eval_Recall": 0.9942528735632183,
115
+ "eval_accuracy": 0.9010416666666666,
116
+ "eval_loss": 0.5799620747566223,
117
+ "eval_runtime": 4.7649,
118
+ "eval_samples_per_second": 80.589,
119
+ "eval_steps_per_second": 5.037,
120
+ "step": 440
121
  },
122
  {
123
  "epoch": 9.0,
124
+ "eval_AUC": 0.49712643678160917,
125
+ "eval_F1": 0.473972602739726,
126
+ "eval_Precision": 0.9057591623036649,
127
+ "eval_Recall": 0.9942528735632183,
128
+ "eval_accuracy": 0.9010416666666666,
129
+ "eval_loss": 0.5976574420928955,
130
+ "eval_runtime": 4.7034,
131
+ "eval_samples_per_second": 81.644,
132
+ "eval_steps_per_second": 5.103,
133
+ "step": 495
134
  },
135
  {
136
+ "epoch": 9.090909090909092,
137
+ "grad_norm": 0.018258079886436462,
138
+ "learning_rate": 7.878787878787879e-05,
139
+ "loss": 0.0987,
 
 
 
 
 
 
 
 
 
 
 
 
 
140
  "step": 500
141
  },
142
+ {
143
+ "epoch": 10.0,
144
+ "eval_AUC": 0.49712643678160917,
145
+ "eval_F1": 0.473972602739726,
146
+ "eval_Precision": 0.9057591623036649,
147
+ "eval_Recall": 0.9942528735632183,
148
+ "eval_accuracy": 0.9010416666666666,
149
+ "eval_loss": 0.6109693646430969,
150
+ "eval_runtime": 4.7422,
151
+ "eval_samples_per_second": 80.974,
152
+ "eval_steps_per_second": 5.061,
153
+ "step": 550
154
+ },
155
  {
156
  "epoch": 11.0,
157
+ "eval_AUC": 0.49712643678160917,
158
+ "eval_F1": 0.473972602739726,
159
+ "eval_Precision": 0.9057591623036649,
160
+ "eval_Recall": 0.9942528735632183,
161
+ "eval_accuracy": 0.9010416666666666,
162
+ "eval_loss": 0.6211499571800232,
163
+ "eval_runtime": 4.7723,
164
+ "eval_samples_per_second": 80.464,
165
+ "eval_steps_per_second": 5.029,
166
+ "step": 605
167
  },
168
  {
169
  "epoch": 12.0,
170
+ "eval_AUC": 0.49712643678160917,
171
+ "eval_F1": 0.473972602739726,
172
+ "eval_Precision": 0.9057591623036649,
173
+ "eval_Recall": 0.9942528735632183,
174
+ "eval_accuracy": 0.9010416666666666,
175
+ "eval_loss": 0.6287771463394165,
176
+ "eval_runtime": 4.9768,
177
+ "eval_samples_per_second": 77.159,
178
+ "eval_steps_per_second": 4.822,
179
+ "step": 660
180
  },
181
  {
182
+ "epoch": 13.0,
183
+ "eval_AUC": 0.49712643678160917,
184
+ "eval_F1": 0.473972602739726,
185
+ "eval_Precision": 0.9057591623036649,
186
+ "eval_Recall": 0.9942528735632183,
187
+ "eval_accuracy": 0.9010416666666666,
188
+ "eval_loss": 0.6341301798820496,
189
+ "eval_runtime": 4.7422,
190
+ "eval_samples_per_second": 80.974,
191
+ "eval_steps_per_second": 5.061,
192
+ "step": 715
193
+ },
194
+ {
195
+ "epoch": 14.0,
196
+ "eval_AUC": 0.49712643678160917,
197
+ "eval_F1": 0.473972602739726,
198
+ "eval_Precision": 0.9057591623036649,
199
+ "eval_Recall": 0.9942528735632183,
200
+ "eval_accuracy": 0.9010416666666666,
201
+ "eval_loss": 0.6373991370201111,
202
+ "eval_runtime": 4.8768,
203
+ "eval_samples_per_second": 78.74,
204
+ "eval_steps_per_second": 4.921,
205
+ "step": 770
206
+ },
207
+ {
208
+ "epoch": 15.0,
209
+ "eval_AUC": 0.49712643678160917,
210
+ "eval_F1": 0.473972602739726,
211
+ "eval_Precision": 0.9057591623036649,
212
+ "eval_Recall": 0.9942528735632183,
213
+ "eval_accuracy": 0.9010416666666666,
214
+ "eval_loss": 0.6385161280632019,
215
+ "eval_runtime": 4.6939,
216
+ "eval_samples_per_second": 81.808,
217
+ "eval_steps_per_second": 5.113,
218
+ "step": 825
219
+ },
220
+ {
221
+ "epoch": 15.0,
222
+ "step": 825,
223
+ "total_flos": 1.0112704644704256e+18,
224
+ "train_loss": 0.06119063453240828,
225
+ "train_runtime": 257.3401,
226
+ "train_samples_per_second": 50.711,
227
+ "train_steps_per_second": 3.206
228
  }
229
  ],
230
  "logging_steps": 500,
231
+ "max_steps": 825,
232
  "num_input_tokens_seen": 0,
233
+ "num_train_epochs": 15,
234
  "save_steps": 500,
235
  "stateful_callbacks": {
236
  "TrainerControl": {
 
244
  "attributes": {}
245
  }
246
  },
247
+ "total_flos": 1.0112704644704256e+18,
248
  "train_batch_size": 16,
249
  "trial_name": null,
250
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:860ac9cc2700a6acca98170286a713aa05b047089895c0cc3d2037638dcd625e
3
  size 4731
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f570a2a2407a22a4528fa092d0409008681075d1ae3fba96df20687f008eccf6
3
  size 4731