synergyai-jaeung commited on
Commit
d217d21
1 Parent(s): db5a405

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "epoch": 8.571428571428571,
3
  "eval_accuracy": 0.9032258064516129,
4
  "eval_auc": 0.5,
5
  "eval_f1": 0.4745762711864407,
@@ -9,9 +9,9 @@
9
  "eval_runtime": 0.6301,
10
  "eval_samples_per_second": 295.208,
11
  "eval_steps_per_second": 4.761,
12
- "total_flos": 1.8691703717363712e+17,
13
- "train_loss": 0.2957582632700602,
14
- "train_runtime": 47.4143,
15
- "train_samples_per_second": 184.754,
16
- "train_steps_per_second": 0.633
17
  }
 
1
  {
2
+ "epoch": 10.0,
3
  "eval_accuracy": 0.9032258064516129,
4
  "eval_auc": 0.5,
5
  "eval_f1": 0.4745762711864407,
 
9
  "eval_runtime": 0.6301,
10
  "eval_samples_per_second": 295.208,
11
  "eval_steps_per_second": 4.761,
12
+ "total_flos": 1.1375723808188006e+18,
13
+ "train_loss": 0.21184425609452384,
14
+ "train_runtime": 168.3293,
15
+ "train_samples_per_second": 52.041,
16
+ "train_steps_per_second": 0.416
17
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d07e7c41d6e3d022c28c3c64002a95b5a168904c992038f6dda631436efb1a4
3
  size 110342832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ba391ebd43096538016e9666601807201abdf2a330498c741679a39b656df7d
3
  size 110342832
runs/May27_16-05-26_RTX3090/events.out.tfevents.1716793533.RTX3090.11668.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6300258e5aae69528f8891f392f6e6e86f1fb4ba969bbab08b06122104977ad
3
+ size 5787
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 8.571428571428571,
3
- "total_flos": 1.8691703717363712e+17,
4
- "train_loss": 0.2957582632700602,
5
- "train_runtime": 47.4143,
6
- "train_samples_per_second": 184.754,
7
- "train_steps_per_second": 0.633
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 1.1375723808188006e+18,
4
+ "train_loss": 0.21184425609452384,
5
+ "train_runtime": 168.3293,
6
+ "train_samples_per_second": 52.041,
7
+ "train_steps_per_second": 0.416
8
  }
trainer_state.json CHANGED
@@ -1,163 +1,204 @@
1
  {
2
  "best_metric": 0.9032258064516129,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-RCC/checkpoint-3",
4
- "epoch": 8.571428571428571,
5
  "eval_steps": 500,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.8571428571428571,
13
  "eval_accuracy": 0.9032258064516129,
14
  "eval_auc": 0.5,
15
  "eval_f1": 0.4745762711864407,
16
- "eval_loss": 0.3023151159286499,
17
  "eval_precision": 0.9032258064516129,
18
  "eval_recall": 1.0,
19
- "eval_runtime": 0.5993,
20
- "eval_samples_per_second": 310.347,
21
- "eval_steps_per_second": 5.006,
22
- "step": 3
 
 
 
 
 
 
 
23
  },
24
  {
25
  "epoch": 2.0,
26
  "eval_accuracy": 0.9032258064516129,
27
  "eval_auc": 0.5,
28
  "eval_f1": 0.4745762711864407,
29
- "eval_loss": 0.36768200993537903,
30
  "eval_precision": 0.9032258064516129,
31
  "eval_recall": 1.0,
32
- "eval_runtime": 0.6162,
33
- "eval_samples_per_second": 301.832,
34
- "eval_steps_per_second": 4.868,
35
- "step": 7
36
  },
37
  {
38
  "epoch": 2.857142857142857,
39
- "grad_norm": 2.596181631088257,
40
- "learning_rate": 3.7037037037037037e-05,
41
- "loss": 0.4028,
42
- "step": 10
43
  },
44
  {
45
- "epoch": 2.857142857142857,
46
  "eval_accuracy": 0.9032258064516129,
47
  "eval_auc": 0.5,
48
  "eval_f1": 0.4745762711864407,
49
- "eval_loss": 0.32757532596588135,
50
  "eval_precision": 0.9032258064516129,
51
  "eval_recall": 1.0,
52
- "eval_runtime": 0.6008,
53
- "eval_samples_per_second": 309.59,
54
- "eval_steps_per_second": 4.993,
55
- "step": 10
56
  },
57
  {
58
  "epoch": 4.0,
59
  "eval_accuracy": 0.9032258064516129,
60
  "eval_auc": 0.5,
61
  "eval_f1": 0.4745762711864407,
62
- "eval_loss": 0.32863086462020874,
63
  "eval_precision": 0.9032258064516129,
64
  "eval_recall": 1.0,
65
- "eval_runtime": 0.6313,
66
- "eval_samples_per_second": 294.647,
67
- "eval_steps_per_second": 4.752,
68
- "step": 14
 
 
 
 
 
 
 
69
  },
70
  {
71
- "epoch": 4.857142857142857,
72
  "eval_accuracy": 0.9032258064516129,
73
  "eval_auc": 0.5,
74
  "eval_f1": 0.4745762711864407,
75
- "eval_loss": 0.3271201252937317,
76
  "eval_precision": 0.9032258064516129,
77
  "eval_recall": 1.0,
78
- "eval_runtime": 0.6283,
79
- "eval_samples_per_second": 296.051,
80
- "eval_steps_per_second": 4.775,
81
- "step": 17
82
  },
83
  {
84
  "epoch": 5.714285714285714,
85
- "grad_norm": 1.759938359260559,
86
- "learning_rate": 1.8518518518518518e-05,
87
- "loss": 0.2494,
88
- "step": 20
89
  },
90
  {
91
  "epoch": 6.0,
92
  "eval_accuracy": 0.9032258064516129,
93
  "eval_auc": 0.5,
94
  "eval_f1": 0.4745762711864407,
95
- "eval_loss": 0.32589343190193176,
96
  "eval_precision": 0.9032258064516129,
97
  "eval_recall": 1.0,
98
- "eval_runtime": 0.607,
99
- "eval_samples_per_second": 306.423,
100
- "eval_steps_per_second": 4.942,
101
- "step": 21
102
  },
103
  {
104
- "epoch": 6.857142857142857,
105
- "eval_accuracy": 0.9032258064516129,
106
- "eval_auc": 0.5,
107
- "eval_f1": 0.4745762711864407,
108
- "eval_loss": 0.3279106020927429,
109
- "eval_precision": 0.9032258064516129,
110
- "eval_recall": 1.0,
111
- "eval_runtime": 0.6103,
112
- "eval_samples_per_second": 304.771,
113
- "eval_steps_per_second": 4.916,
114
- "step": 24
 
 
 
 
 
 
 
115
  },
116
  {
117
  "epoch": 8.0,
118
- "eval_accuracy": 0.9032258064516129,
119
- "eval_auc": 0.5,
120
- "eval_f1": 0.4745762711864407,
121
- "eval_loss": 0.3266947269439697,
122
- "eval_precision": 0.9032258064516129,
123
- "eval_recall": 1.0,
124
- "eval_runtime": 0.6353,
125
- "eval_samples_per_second": 292.77,
126
- "eval_steps_per_second": 4.722,
127
- "step": 28
128
  },
129
  {
130
  "epoch": 8.571428571428571,
131
- "grad_norm": 2.163374423980713,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
132
  "learning_rate": 0.0,
133
- "loss": 0.2351,
134
- "step": 30
135
  },
136
  {
137
- "epoch": 8.571428571428571,
138
- "eval_accuracy": 0.9032258064516129,
139
- "eval_auc": 0.5,
140
- "eval_f1": 0.4745762711864407,
141
- "eval_loss": 0.32613006234169006,
142
- "eval_precision": 0.9032258064516129,
143
- "eval_recall": 1.0,
144
- "eval_runtime": 0.6179,
145
- "eval_samples_per_second": 301.013,
146
- "eval_steps_per_second": 4.855,
147
- "step": 30
148
  },
149
  {
150
- "epoch": 8.571428571428571,
151
- "step": 30,
152
- "total_flos": 1.8691703717363712e+17,
153
- "train_loss": 0.2957582632700602,
154
- "train_runtime": 47.4143,
155
- "train_samples_per_second": 184.754,
156
- "train_steps_per_second": 0.633
157
  }
158
  ],
159
  "logging_steps": 10,
160
- "max_steps": 30,
161
  "num_input_tokens_seen": 0,
162
  "num_train_epochs": 10,
163
  "save_steps": 500,
@@ -173,8 +214,8 @@
173
  "attributes": {}
174
  }
175
  },
176
- "total_flos": 1.8691703717363712e+17,
177
- "train_batch_size": 64,
178
  "trial_name": null,
179
  "trial_params": null
180
  }
 
1
  {
2
  "best_metric": 0.9032258064516129,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-RCC/checkpoint-7",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 70,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.0,
13
  "eval_accuracy": 0.9032258064516129,
14
  "eval_auc": 0.5,
15
  "eval_f1": 0.4745762711864407,
16
+ "eval_loss": 0.3295924961566925,
17
  "eval_precision": 0.9032258064516129,
18
  "eval_recall": 1.0,
19
+ "eval_runtime": 1.1464,
20
+ "eval_samples_per_second": 162.249,
21
+ "eval_steps_per_second": 5.234,
22
+ "step": 7
23
+ },
24
+ {
25
+ "epoch": 1.4285714285714286,
26
+ "grad_norm": 0.9726035594940186,
27
+ "learning_rate": 4.761904761904762e-05,
28
+ "loss": 0.4795,
29
+ "step": 10
30
  },
31
  {
32
  "epoch": 2.0,
33
  "eval_accuracy": 0.9032258064516129,
34
  "eval_auc": 0.5,
35
  "eval_f1": 0.4745762711864407,
36
+ "eval_loss": 0.31294792890548706,
37
  "eval_precision": 0.9032258064516129,
38
  "eval_recall": 1.0,
39
+ "eval_runtime": 1.0901,
40
+ "eval_samples_per_second": 170.621,
41
+ "eval_steps_per_second": 5.504,
42
+ "step": 14
43
  },
44
  {
45
  "epoch": 2.857142857142857,
46
+ "grad_norm": 0.6543672680854797,
47
+ "learning_rate": 3.968253968253968e-05,
48
+ "loss": 0.2503,
49
+ "step": 20
50
  },
51
  {
52
+ "epoch": 3.0,
53
  "eval_accuracy": 0.9032258064516129,
54
  "eval_auc": 0.5,
55
  "eval_f1": 0.4745762711864407,
56
+ "eval_loss": 0.31820589303970337,
57
  "eval_precision": 0.9032258064516129,
58
  "eval_recall": 1.0,
59
+ "eval_runtime": 1.1148,
60
+ "eval_samples_per_second": 166.845,
61
+ "eval_steps_per_second": 5.382,
62
+ "step": 21
63
  },
64
  {
65
  "epoch": 4.0,
66
  "eval_accuracy": 0.9032258064516129,
67
  "eval_auc": 0.5,
68
  "eval_f1": 0.4745762711864407,
69
+ "eval_loss": 0.2973339259624481,
70
  "eval_precision": 0.9032258064516129,
71
  "eval_recall": 1.0,
72
+ "eval_runtime": 1.1837,
73
+ "eval_samples_per_second": 157.138,
74
+ "eval_steps_per_second": 5.069,
75
+ "step": 28
76
+ },
77
+ {
78
+ "epoch": 4.285714285714286,
79
+ "grad_norm": 1.603426218032837,
80
+ "learning_rate": 3.1746031746031745e-05,
81
+ "loss": 0.2231,
82
+ "step": 30
83
  },
84
  {
85
+ "epoch": 5.0,
86
  "eval_accuracy": 0.9032258064516129,
87
  "eval_auc": 0.5,
88
  "eval_f1": 0.4745762711864407,
89
+ "eval_loss": 0.3274933993816376,
90
  "eval_precision": 0.9032258064516129,
91
  "eval_recall": 1.0,
92
+ "eval_runtime": 1.1347,
93
+ "eval_samples_per_second": 163.913,
94
+ "eval_steps_per_second": 5.288,
95
+ "step": 35
96
  },
97
  {
98
  "epoch": 5.714285714285714,
99
+ "grad_norm": 1.8515961170196533,
100
+ "learning_rate": 2.380952380952381e-05,
101
+ "loss": 0.1791,
102
+ "step": 40
103
  },
104
  {
105
  "epoch": 6.0,
106
  "eval_accuracy": 0.9032258064516129,
107
  "eval_auc": 0.5,
108
  "eval_f1": 0.4745762711864407,
109
+ "eval_loss": 0.31467387080192566,
110
  "eval_precision": 0.9032258064516129,
111
  "eval_recall": 1.0,
112
+ "eval_runtime": 1.1182,
113
+ "eval_samples_per_second": 166.344,
114
+ "eval_steps_per_second": 5.366,
115
+ "step": 42
116
  },
117
  {
118
+ "epoch": 7.0,
119
+ "eval_accuracy": 0.8978494623655914,
120
+ "eval_auc": 0.5218253968253969,
121
+ "eval_f1": 0.5205535205535206,
122
+ "eval_loss": 0.34014198184013367,
123
+ "eval_precision": 0.907103825136612,
124
+ "eval_recall": 0.9880952380952381,
125
+ "eval_runtime": 1.1252,
126
+ "eval_samples_per_second": 165.308,
127
+ "eval_steps_per_second": 5.333,
128
+ "step": 49
129
+ },
130
+ {
131
+ "epoch": 7.142857142857143,
132
+ "grad_norm": 1.4963322877883911,
133
+ "learning_rate": 1.5873015873015872e-05,
134
+ "loss": 0.1361,
135
+ "step": 50
136
  },
137
  {
138
  "epoch": 8.0,
139
+ "eval_accuracy": 0.7849462365591398,
140
+ "eval_auc": 0.5833333333333335,
141
+ "eval_f1": 0.5528846153846154,
142
+ "eval_loss": 0.3884872794151306,
143
+ "eval_precision": 0.9210526315789473,
144
+ "eval_recall": 0.8333333333333334,
145
+ "eval_runtime": 1.1007,
146
+ "eval_samples_per_second": 168.985,
147
+ "eval_steps_per_second": 5.451,
148
+ "step": 56
149
  },
150
  {
151
  "epoch": 8.571428571428571,
152
+ "grad_norm": 2.6748523712158203,
153
+ "learning_rate": 7.936507936507936e-06,
154
+ "loss": 0.1245,
155
+ "step": 60
156
+ },
157
+ {
158
+ "epoch": 9.0,
159
+ "eval_accuracy": 0.8817204301075269,
160
+ "eval_auc": 0.5873015873015872,
161
+ "eval_f1": 0.6011695906432748,
162
+ "eval_loss": 0.31924736499786377,
163
+ "eval_precision": 0.9195402298850575,
164
+ "eval_recall": 0.9523809523809523,
165
+ "eval_runtime": 1.117,
166
+ "eval_samples_per_second": 166.524,
167
+ "eval_steps_per_second": 5.372,
168
+ "step": 63
169
+ },
170
+ {
171
+ "epoch": 10.0,
172
+ "grad_norm": 3.4235951900482178,
173
  "learning_rate": 0.0,
174
+ "loss": 0.0902,
175
+ "step": 70
176
  },
177
  {
178
+ "epoch": 10.0,
179
+ "eval_accuracy": 0.8225806451612904,
180
+ "eval_auc": 0.6041666666666667,
181
+ "eval_f1": 0.5828746177370031,
182
+ "eval_loss": 0.35260289907455444,
183
+ "eval_precision": 0.9245283018867925,
184
+ "eval_recall": 0.875,
185
+ "eval_runtime": 1.1366,
186
+ "eval_samples_per_second": 163.644,
187
+ "eval_steps_per_second": 5.279,
188
+ "step": 70
189
  },
190
  {
191
+ "epoch": 10.0,
192
+ "step": 70,
193
+ "total_flos": 1.1375723808188006e+18,
194
+ "train_loss": 0.21184425609452384,
195
+ "train_runtime": 168.3293,
196
+ "train_samples_per_second": 52.041,
197
+ "train_steps_per_second": 0.416
198
  }
199
  ],
200
  "logging_steps": 10,
201
+ "max_steps": 70,
202
  "num_input_tokens_seen": 0,
203
  "num_train_epochs": 10,
204
  "save_steps": 500,
 
214
  "attributes": {}
215
  }
216
  },
217
+ "total_flos": 1.1375723808188006e+18,
218
+ "train_batch_size": 32,
219
  "trial_name": null,
220
  "trial_params": null
221
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e96781d201b4962023e2deb6df7f41bd5345729797e7384d64800c6fd5a32f6
3
  size 4731
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b26dc6bdef927a082d55156b77826a6cdd5096fa7c2241429ac0ddb18ef1bc
3
  size 4731