synergyai-jaeung commited on
Commit
0c1efc0
1 Parent(s): 524e0fb

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,17 @@
1
  {
2
- "epoch": 2.873239436619718,
3
- "total_flos": 3.244203682433925e+17,
4
- "train_loss": 0.3726242260605681,
5
- "train_runtime": 73.4486,
6
- "train_samples_per_second": 185.517,
7
- "train_steps_per_second": 0.694
 
 
 
 
 
 
 
 
 
8
  }
 
1
  {
2
+ "epoch": 8.571428571428571,
3
+ "eval_accuracy": 0.9032258064516129,
4
+ "eval_auc": 0.5,
5
+ "eval_f1": 0.4745762711864407,
6
+ "eval_loss": 0.33827999234199524,
7
+ "eval_precision": 0.9032258064516129,
8
+ "eval_recall": 1.0,
9
+ "eval_runtime": 1.0789,
10
+ "eval_samples_per_second": 172.394,
11
+ "eval_steps_per_second": 2.781,
12
+ "total_flos": 1.8691703717363712e+17,
13
+ "train_loss": 0.28762030601501465,
14
+ "train_runtime": 70.3105,
15
+ "train_samples_per_second": 124.59,
16
+ "train_steps_per_second": 0.427
17
  }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.571428571428571,
3
+ "eval_accuracy": 0.9032258064516129,
4
+ "eval_auc": 0.5,
5
+ "eval_f1": 0.4745762711864407,
6
+ "eval_loss": 0.33827999234199524,
7
+ "eval_precision": 0.9032258064516129,
8
+ "eval_recall": 1.0,
9
+ "eval_runtime": 1.0789,
10
+ "eval_samples_per_second": 172.394,
11
+ "eval_steps_per_second": 2.781
12
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2123dddc8cf19a8528f3a439ec0602810e134fa81cdd885aa3dc9a71fd8ed159
3
  size 110342832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dd2e3b6404034899d709305ce15a3ca43637919f5098d55edd7a72091de6aad
3
  size 110342832
runs/May24_16-50-18_RTX3090/events.out.tfevents.1716537217.RTX3090.3776938.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:900ffa8fe3f58126fd4674b5a512e1472876aa3ebf308aec6d241ac078b2f0fb
3
+ size 597
runs/May24_17-00-00_RTX3090/events.out.tfevents.1716537603.RTX3090.3776938.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fd2774dc57b8778ffc6c016d123a3a75522c5892bb087534f10368efa5ed579
3
+ size 5786
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.873239436619718,
3
- "total_flos": 3.244203682433925e+17,
4
- "train_loss": 0.3726242260605681,
5
- "train_runtime": 73.4486,
6
- "train_samples_per_second": 185.517,
7
- "train_steps_per_second": 0.694
8
  }
 
1
  {
2
+ "epoch": 8.571428571428571,
3
+ "total_flos": 1.8691703717363712e+17,
4
+ "train_loss": 0.28762030601501465,
5
+ "train_runtime": 70.3105,
6
+ "train_samples_per_second": 124.59,
7
+ "train_steps_per_second": 0.427
8
  }
trainer_state.json CHANGED
@@ -1,101 +1,165 @@
1
  {
2
- "best_metric": 0.8162729658792651,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-RCC/checkpoint-51",
4
- "epoch": 2.873239436619718,
5
  "eval_steps": 500,
6
- "global_step": 51,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.5633802816901409,
13
- "grad_norm": 37.96213912963867,
14
- "learning_rate": 4.555555555555556e-05,
15
- "loss": 0.3224,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.9577464788732394,
20
- "eval_accuracy": 0.6482939632545932,
21
- "eval_auc": 0.5379230308475591,
22
- "eval_f1": 0.5145158376204106,
23
- "eval_loss": 0.6836453080177307,
24
- "eval_precision": 0.8498098859315589,
25
- "eval_recall": 0.7028301886792453,
26
- "eval_runtime": 2.677,
27
- "eval_samples_per_second": 284.647,
28
- "eval_steps_per_second": 4.483,
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  "step": 17
30
  },
31
  {
32
- "epoch": 1.1267605633802817,
33
- "grad_norm": 6.688726902008057,
34
- "learning_rate": 3.444444444444445e-05,
35
- "loss": 0.3482,
36
  "step": 20
37
  },
38
  {
39
- "epoch": 1.6901408450704225,
40
- "grad_norm": 3.9382684230804443,
41
- "learning_rate": 2.3333333333333336e-05,
42
- "loss": 0.3829,
43
- "step": 30
 
 
 
 
 
 
44
  },
45
  {
46
- "epoch": 1.971830985915493,
47
- "eval_accuracy": 0.8044619422572179,
48
- "eval_auc": 0.5201033243486074,
49
- "eval_f1": 0.5142198243219538,
50
- "eval_loss": 0.48597800731658936,
51
- "eval_precision": 0.8405594405594405,
52
- "eval_recall": 0.9449685534591195,
53
- "eval_runtime": 2.6435,
54
- "eval_samples_per_second": 288.253,
55
- "eval_steps_per_second": 4.539,
56
- "step": 35
57
  },
58
  {
59
- "epoch": 2.2535211267605635,
60
- "grad_norm": 3.417764186859131,
61
- "learning_rate": 1.2222222222222222e-05,
62
- "loss": 0.405,
63
- "step": 40
 
 
 
 
 
 
64
  },
65
  {
66
- "epoch": 2.816901408450704,
67
- "grad_norm": 4.870389461517334,
68
- "learning_rate": 1.1111111111111112e-06,
69
- "loss": 0.4052,
70
- "step": 50
71
  },
72
  {
73
- "epoch": 2.873239436619718,
74
- "eval_accuracy": 0.8162729658792651,
75
- "eval_auc": 0.5208146151542379,
76
- "eval_f1": 0.5111803519061584,
77
- "eval_loss": 0.48757827281951904,
78
- "eval_precision": 0.8406593406593407,
79
- "eval_recall": 0.9622641509433962,
80
- "eval_runtime": 2.7101,
81
- "eval_samples_per_second": 281.168,
82
- "eval_steps_per_second": 4.428,
83
- "step": 51
84
  },
85
  {
86
- "epoch": 2.873239436619718,
87
- "step": 51,
88
- "total_flos": 3.244203682433925e+17,
89
- "train_loss": 0.3726242260605681,
90
- "train_runtime": 73.4486,
91
- "train_samples_per_second": 185.517,
92
- "train_steps_per_second": 0.694
93
  }
94
  ],
95
  "logging_steps": 10,
96
- "max_steps": 51,
97
  "num_input_tokens_seen": 0,
98
- "num_train_epochs": 3,
99
  "save_steps": 500,
100
  "stateful_callbacks": {
101
  "TrainerControl": {
@@ -109,7 +173,7 @@
109
  "attributes": {}
110
  }
111
  },
112
- "total_flos": 3.244203682433925e+17,
113
  "train_batch_size": 64,
114
  "trial_name": null,
115
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9032258064516129,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-RCC/checkpoint-3",
4
+ "epoch": 8.571428571428571,
5
  "eval_steps": 500,
6
+ "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.8571428571428571,
13
+ "eval_accuracy": 0.9032258064516129,
14
+ "eval_auc": 0.5,
15
+ "eval_f1": 0.4745762711864407,
16
+ "eval_loss": 0.33827999234199524,
17
+ "eval_precision": 0.9032258064516129,
18
+ "eval_recall": 1.0,
19
+ "eval_runtime": 1.0242,
20
+ "eval_samples_per_second": 181.602,
21
+ "eval_steps_per_second": 2.929,
22
+ "step": 3
23
+ },
24
+ {
25
+ "epoch": 2.0,
26
+ "eval_accuracy": 0.9032258064516129,
27
+ "eval_auc": 0.5,
28
+ "eval_f1": 0.4745762711864407,
29
+ "eval_loss": 0.3653673529624939,
30
+ "eval_precision": 0.9032258064516129,
31
+ "eval_recall": 1.0,
32
+ "eval_runtime": 1.0375,
33
+ "eval_samples_per_second": 179.274,
34
+ "eval_steps_per_second": 2.892,
35
+ "step": 7
36
+ },
37
+ {
38
+ "epoch": 2.857142857142857,
39
+ "grad_norm": 4.537749767303467,
40
+ "learning_rate": 3.7037037037037037e-05,
41
+ "loss": 0.3833,
42
+ "step": 10
43
+ },
44
+ {
45
+ "epoch": 2.857142857142857,
46
+ "eval_accuracy": 0.9032258064516129,
47
+ "eval_auc": 0.5,
48
+ "eval_f1": 0.4745762711864407,
49
+ "eval_loss": 0.3421719968318939,
50
+ "eval_precision": 0.9032258064516129,
51
+ "eval_recall": 1.0,
52
+ "eval_runtime": 1.0114,
53
+ "eval_samples_per_second": 183.911,
54
+ "eval_steps_per_second": 2.966,
55
  "step": 10
56
  },
57
  {
58
+ "epoch": 4.0,
59
+ "eval_accuracy": 0.9032258064516129,
60
+ "eval_auc": 0.5,
61
+ "eval_f1": 0.4745762711864407,
62
+ "eval_loss": 0.3555563986301422,
63
+ "eval_precision": 0.9032258064516129,
64
+ "eval_recall": 1.0,
65
+ "eval_runtime": 1.0242,
66
+ "eval_samples_per_second": 181.606,
67
+ "eval_steps_per_second": 2.929,
68
+ "step": 14
69
+ },
70
+ {
71
+ "epoch": 4.857142857142857,
72
+ "eval_accuracy": 0.9032258064516129,
73
+ "eval_auc": 0.5,
74
+ "eval_f1": 0.4745762711864407,
75
+ "eval_loss": 0.3424948453903198,
76
+ "eval_precision": 0.9032258064516129,
77
+ "eval_recall": 1.0,
78
+ "eval_runtime": 1.0046,
79
+ "eval_samples_per_second": 185.14,
80
+ "eval_steps_per_second": 2.986,
81
  "step": 17
82
  },
83
  {
84
+ "epoch": 5.714285714285714,
85
+ "grad_norm": 1.4052001237869263,
86
+ "learning_rate": 1.8518518518518518e-05,
87
+ "loss": 0.2492,
88
  "step": 20
89
  },
90
  {
91
+ "epoch": 6.0,
92
+ "eval_accuracy": 0.9032258064516129,
93
+ "eval_auc": 0.5,
94
+ "eval_f1": 0.4745762711864407,
95
+ "eval_loss": 0.3400775194168091,
96
+ "eval_precision": 0.9032258064516129,
97
+ "eval_recall": 1.0,
98
+ "eval_runtime": 1.0288,
99
+ "eval_samples_per_second": 180.792,
100
+ "eval_steps_per_second": 2.916,
101
+ "step": 21
102
  },
103
  {
104
+ "epoch": 6.857142857142857,
105
+ "eval_accuracy": 0.9032258064516129,
106
+ "eval_auc": 0.5,
107
+ "eval_f1": 0.4745762711864407,
108
+ "eval_loss": 0.35429030656814575,
109
+ "eval_precision": 0.9032258064516129,
110
+ "eval_recall": 1.0,
111
+ "eval_runtime": 0.999,
112
+ "eval_samples_per_second": 186.195,
113
+ "eval_steps_per_second": 3.003,
114
+ "step": 24
115
  },
116
  {
117
+ "epoch": 8.0,
118
+ "eval_accuracy": 0.9032258064516129,
119
+ "eval_auc": 0.5,
120
+ "eval_f1": 0.4745762711864407,
121
+ "eval_loss": 0.3571774363517761,
122
+ "eval_precision": 0.9032258064516129,
123
+ "eval_recall": 1.0,
124
+ "eval_runtime": 1.0317,
125
+ "eval_samples_per_second": 180.286,
126
+ "eval_steps_per_second": 2.908,
127
+ "step": 28
128
  },
129
  {
130
+ "epoch": 8.571428571428571,
131
+ "grad_norm": 1.283613920211792,
132
+ "learning_rate": 0.0,
133
+ "loss": 0.2304,
134
+ "step": 30
135
  },
136
  {
137
+ "epoch": 8.571428571428571,
138
+ "eval_accuracy": 0.9032258064516129,
139
+ "eval_auc": 0.5,
140
+ "eval_f1": 0.4745762711864407,
141
+ "eval_loss": 0.35649099946022034,
142
+ "eval_precision": 0.9032258064516129,
143
+ "eval_recall": 1.0,
144
+ "eval_runtime": 1.006,
145
+ "eval_samples_per_second": 184.89,
146
+ "eval_steps_per_second": 2.982,
147
+ "step": 30
148
  },
149
  {
150
+ "epoch": 8.571428571428571,
151
+ "step": 30,
152
+ "total_flos": 1.8691703717363712e+17,
153
+ "train_loss": 0.28762030601501465,
154
+ "train_runtime": 70.3105,
155
+ "train_samples_per_second": 124.59,
156
+ "train_steps_per_second": 0.427
157
  }
158
  ],
159
  "logging_steps": 10,
160
+ "max_steps": 30,
161
  "num_input_tokens_seen": 0,
162
+ "num_train_epochs": 10,
163
  "save_steps": 500,
164
  "stateful_callbacks": {
165
  "TrainerControl": {
 
173
  "attributes": {}
174
  }
175
  },
176
+ "total_flos": 1.8691703717363712e+17,
177
  "train_batch_size": 64,
178
  "trial_name": null,
179
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b51c58804bde30d77029103e316923288b7e152ac500fbd62212b7d62e90453
3
  size 4731
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d4c5476f8f49bfc14a67ca98ff73785fd0e5765eba1ff25ad649cd22bc6aaea
3
  size 4731