moock committed on
Commit
a8d3f95
1 Parent(s): 52e2f94

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7953020134228188
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,20 +32,20 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.5942
36
- - Accuracy: 0.7953
37
 
38
  ## Model description
39
 
40
- Predict Expansion Grade - Gardner Score from an embryo image
41
 
42
  ## Intended uses & limitations
43
 
44
- More information will be provided
45
 
46
  ## Training and evaluation data
47
 
48
- More information needed will be provided
49
 
50
  ## Training procedure
51
 
@@ -67,16 +67,16 @@ The following hyperparameters were used during training:
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
69
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
70
- | 1.6004 | 0.97 | 14 | 1.4012 | 0.5463 |
71
- | 1.4099 | 2.0 | 29 | 1.0249 | 0.5463 |
72
- | 1.1043 | 2.97 | 43 | 0.9695 | 0.6732 |
73
- | 1.0028 | 4.0 | 58 | 0.8659 | 0.6585 |
74
- | 0.8915 | 4.97 | 72 | 0.7728 | 0.7317 |
75
- | 0.8824 | 6.0 | 87 | 0.7238 | 0.7220 |
76
- | 0.8286 | 6.97 | 101 | 0.7220 | 0.7220 |
77
- | 0.8274 | 8.0 | 116 | 0.7376 | 0.6976 |
78
- | 0.7765 | 8.97 | 130 | 0.7117 | 0.7366 |
79
- | 0.7633 | 9.66 | 140 | 0.7079 | 0.7366 |
80
 
81
 
82
  ### Framework versions
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.8154362416107382
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6445
36
+ - Accuracy: 0.8154
37
 
38
  ## Model description
39
 
40
+ More information needed
41
 
42
  ## Intended uses & limitations
43
 
44
+ More information needed
45
 
46
  ## Training and evaluation data
47
 
48
+ More information needed
49
 
50
  ## Training procedure
51
 
 
67
 
68
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
69
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
70
+ | 1.6002 | 0.97 | 14 | 1.4558 | 0.5024 |
71
+ | 1.4093 | 2.0 | 29 | 1.2320 | 0.5024 |
72
+ | 1.1068 | 2.97 | 43 | 1.0740 | 0.5951 |
73
+ | 0.9988 | 4.0 | 58 | 0.9967 | 0.6049 |
74
+ | 0.9099 | 4.97 | 72 | 0.9248 | 0.6 |
75
+ | 0.8674 | 6.0 | 87 | 0.8766 | 0.6780 |
76
+ | 0.8638 | 6.97 | 101 | 0.8656 | 0.6732 |
77
+ | 0.833 | 8.0 | 116 | 0.8395 | 0.6732 |
78
+ | 0.8211 | 8.97 | 130 | 0.8204 | 0.6927 |
79
+ | 0.8236 | 9.66 | 140 | 0.8204 | 0.6780 |
80
 
81
 
82
  ### Framework versions
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 9.66,
3
- "eval_accuracy": 0.7953020134228188,
4
- "eval_loss": 0.5942178964614868,
5
- "eval_runtime": 12.097,
6
- "eval_samples_per_second": 24.634,
7
- "eval_steps_per_second": 0.827,
8
- "train_loss": 0.9881165368216378,
9
- "train_runtime": 1025.6442,
10
- "train_samples_per_second": 17.93,
11
- "train_steps_per_second": 0.136
12
  }
 
1
  {
2
  "epoch": 9.66,
3
+ "eval_accuracy": 0.8154362416107382,
4
+ "eval_loss": 0.6445475816726685,
5
+ "eval_runtime": 10.3295,
6
+ "eval_samples_per_second": 28.849,
7
+ "eval_steps_per_second": 0.968,
8
+ "train_loss": 1.0145302023206437,
9
+ "train_runtime": 896.6945,
10
+ "train_samples_per_second": 20.509,
11
+ "train_steps_per_second": 0.156
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 9.66,
3
- "eval_accuracy": 0.7953020134228188,
4
- "eval_loss": 0.5942178964614868,
5
- "eval_runtime": 12.097,
6
- "eval_samples_per_second": 24.634,
7
- "eval_steps_per_second": 0.827
8
  }
 
1
  {
2
  "epoch": 9.66,
3
+ "eval_accuracy": 0.8154362416107382,
4
+ "eval_loss": 0.6445475816726685,
5
+ "eval_runtime": 10.3295,
6
+ "eval_samples_per_second": 28.849,
7
+ "eval_steps_per_second": 0.968
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b84f52166f9698bfa19378546856697dc85b2c450c8f3451dc214fc69bf72d4b
3
  size 110359372
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8780f92caaadaf679a8727782284d64e7aa4f2cb477acc21b6624ba44457c5be
3
  size 110359372
runs/Dec27_20-34-04_MacBook-Pro-de-Max-2.local/events.out.tfevents.1703705661.MacBook-Pro-de-Max-2.local.31343.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17acf8ed3bafcf6454846910a222c3a7dbf4d0fe91346c3b33161818b1d52a50
3
+ size 10529
runs/Dec27_20-34-04_MacBook-Pro-de-Max-2.local/events.out.tfevents.1703706562.MacBook-Pro-de-Max-2.local.31343.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974b8511e863c985ecfd8a02ca2c8ba9e572ebcaa81131b7ed2e7603442a0f02
3
+ size 734
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 9.66,
3
- "train_loss": 0.9881165368216378,
4
- "train_runtime": 1025.6442,
5
- "train_samples_per_second": 17.93,
6
- "train_steps_per_second": 0.136
7
  }
 
1
  {
2
  "epoch": 9.66,
3
+ "train_loss": 1.0145302023206437,
4
+ "train_runtime": 896.6945,
5
+ "train_samples_per_second": 20.509,
6
+ "train_steps_per_second": 0.156
7
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.7365853658536585,
3
  "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-finetuned-gardner-exp-max/checkpoint-130",
4
  "epoch": 9.655172413793103,
5
  "eval_steps": 500,
@@ -11,185 +11,185 @@
11
  {
12
  "epoch": 0.69,
13
  "learning_rate": 3.571428571428572e-05,
14
- "loss": 1.6004,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.97,
19
- "eval_accuracy": 0.5463414634146342,
20
- "eval_loss": 1.401221752166748,
21
- "eval_runtime": 10.6657,
22
- "eval_samples_per_second": 19.22,
23
- "eval_steps_per_second": 0.656,
24
  "step": 14
25
  },
26
  {
27
  "epoch": 1.38,
28
  "learning_rate": 4.761904761904762e-05,
29
- "loss": 1.4099,
30
  "step": 20
31
  },
32
  {
33
  "epoch": 2.0,
34
- "eval_accuracy": 0.5463414634146342,
35
- "eval_loss": 1.024906039237976,
36
- "eval_runtime": 3.9358,
37
- "eval_samples_per_second": 52.086,
38
- "eval_steps_per_second": 1.779,
39
  "step": 29
40
  },
41
  {
42
  "epoch": 2.07,
43
  "learning_rate": 4.3650793650793655e-05,
44
- "loss": 1.1287,
45
  "step": 30
46
  },
47
  {
48
  "epoch": 2.76,
49
  "learning_rate": 3.968253968253968e-05,
50
- "loss": 1.1043,
51
  "step": 40
52
  },
53
  {
54
  "epoch": 2.97,
55
- "eval_accuracy": 0.6731707317073171,
56
- "eval_loss": 0.9695160388946533,
57
- "eval_runtime": 4.1803,
58
- "eval_samples_per_second": 49.039,
59
- "eval_steps_per_second": 1.675,
60
  "step": 43
61
  },
62
  {
63
  "epoch": 3.45,
64
  "learning_rate": 3.571428571428572e-05,
65
- "loss": 1.0028,
66
  "step": 50
67
  },
68
  {
69
  "epoch": 4.0,
70
- "eval_accuracy": 0.6585365853658537,
71
- "eval_loss": 0.8658934235572815,
72
- "eval_runtime": 4.0107,
73
- "eval_samples_per_second": 51.114,
74
- "eval_steps_per_second": 1.745,
75
  "step": 58
76
  },
77
  {
78
  "epoch": 4.14,
79
  "learning_rate": 3.1746031746031745e-05,
80
- "loss": 0.9609,
81
  "step": 60
82
  },
83
  {
84
  "epoch": 4.83,
85
  "learning_rate": 2.777777777777778e-05,
86
- "loss": 0.8915,
87
  "step": 70
88
  },
89
  {
90
  "epoch": 4.97,
91
- "eval_accuracy": 0.7317073170731707,
92
- "eval_loss": 0.7727790474891663,
93
- "eval_runtime": 4.0395,
94
- "eval_samples_per_second": 50.748,
95
- "eval_steps_per_second": 1.733,
96
  "step": 72
97
  },
98
  {
99
  "epoch": 5.52,
100
  "learning_rate": 2.380952380952381e-05,
101
- "loss": 0.8824,
102
  "step": 80
103
  },
104
  {
105
  "epoch": 6.0,
106
- "eval_accuracy": 0.7219512195121951,
107
- "eval_loss": 0.7237768173217773,
108
- "eval_runtime": 3.9086,
109
- "eval_samples_per_second": 52.449,
110
- "eval_steps_per_second": 1.791,
111
  "step": 87
112
  },
113
  {
114
  "epoch": 6.21,
115
  "learning_rate": 1.984126984126984e-05,
116
- "loss": 0.8629,
117
  "step": 90
118
  },
119
  {
120
  "epoch": 6.9,
121
  "learning_rate": 1.5873015873015872e-05,
122
- "loss": 0.8286,
123
  "step": 100
124
  },
125
  {
126
  "epoch": 6.97,
127
- "eval_accuracy": 0.7219512195121951,
128
- "eval_loss": 0.7219818830490112,
129
- "eval_runtime": 3.9131,
130
- "eval_samples_per_second": 52.389,
131
- "eval_steps_per_second": 1.789,
132
  "step": 101
133
  },
134
  {
135
  "epoch": 7.59,
136
  "learning_rate": 1.1904761904761905e-05,
137
- "loss": 0.8274,
138
  "step": 110
139
  },
140
  {
141
  "epoch": 8.0,
142
- "eval_accuracy": 0.697560975609756,
143
- "eval_loss": 0.7375687956809998,
144
- "eval_runtime": 3.8911,
145
- "eval_samples_per_second": 52.685,
146
- "eval_steps_per_second": 1.799,
147
  "step": 116
148
  },
149
  {
150
  "epoch": 8.28,
151
  "learning_rate": 7.936507936507936e-06,
152
- "loss": 0.794,
153
  "step": 120
154
  },
155
  {
156
  "epoch": 8.97,
157
  "learning_rate": 3.968253968253968e-06,
158
- "loss": 0.7765,
159
  "step": 130
160
  },
161
  {
162
  "epoch": 8.97,
163
- "eval_accuracy": 0.7365853658536585,
164
- "eval_loss": 0.7116620540618896,
165
- "eval_runtime": 3.9546,
166
- "eval_samples_per_second": 51.839,
167
- "eval_steps_per_second": 1.77,
168
  "step": 130
169
  },
170
  {
171
  "epoch": 9.66,
172
  "learning_rate": 0.0,
173
- "loss": 0.7633,
174
  "step": 140
175
  },
176
  {
177
  "epoch": 9.66,
178
- "eval_accuracy": 0.7365853658536585,
179
- "eval_loss": 0.7078527212142944,
180
- "eval_runtime": 4.1225,
181
- "eval_samples_per_second": 49.727,
182
- "eval_steps_per_second": 1.698,
183
  "step": 140
184
  },
185
  {
186
  "epoch": 9.66,
187
  "step": 140,
188
  "total_flos": 5.78085766574506e+17,
189
- "train_loss": 0.9881165368216378,
190
- "train_runtime": 1025.6442,
191
- "train_samples_per_second": 17.93,
192
- "train_steps_per_second": 0.136
193
  }
194
  ],
195
  "logging_steps": 10,
 
1
  {
2
+ "best_metric": 0.6926829268292682,
3
  "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-finetuned-gardner-exp-max/checkpoint-130",
4
  "epoch": 9.655172413793103,
5
  "eval_steps": 500,
 
11
  {
12
  "epoch": 0.69,
13
  "learning_rate": 3.571428571428572e-05,
14
+ "loss": 1.6002,
15
  "step": 10
16
  },
17
  {
18
  "epoch": 0.97,
19
+ "eval_accuracy": 0.5024390243902439,
20
+ "eval_loss": 1.4557533264160156,
21
+ "eval_runtime": 10.833,
22
+ "eval_samples_per_second": 18.924,
23
+ "eval_steps_per_second": 0.646,
24
  "step": 14
25
  },
26
  {
27
  "epoch": 1.38,
28
  "learning_rate": 4.761904761904762e-05,
29
+ "loss": 1.4093,
30
  "step": 20
31
  },
32
  {
33
  "epoch": 2.0,
34
+ "eval_accuracy": 0.5024390243902439,
35
+ "eval_loss": 1.2319719791412354,
36
+ "eval_runtime": 4.0581,
37
+ "eval_samples_per_second": 50.516,
38
+ "eval_steps_per_second": 1.725,
39
  "step": 29
40
  },
41
  {
42
  "epoch": 2.07,
43
  "learning_rate": 4.3650793650793655e-05,
44
+ "loss": 1.232,
45
  "step": 30
46
  },
47
  {
48
  "epoch": 2.76,
49
  "learning_rate": 3.968253968253968e-05,
50
+ "loss": 1.1068,
51
  "step": 40
52
  },
53
  {
54
  "epoch": 2.97,
55
+ "eval_accuracy": 0.5951219512195122,
56
+ "eval_loss": 1.0739854574203491,
57
+ "eval_runtime": 4.0516,
58
+ "eval_samples_per_second": 50.598,
59
+ "eval_steps_per_second": 1.728,
60
  "step": 43
61
  },
62
  {
63
  "epoch": 3.45,
64
  "learning_rate": 3.571428571428572e-05,
65
+ "loss": 0.9988,
66
  "step": 50
67
  },
68
  {
69
  "epoch": 4.0,
70
+ "eval_accuracy": 0.6048780487804878,
71
+ "eval_loss": 0.9966912865638733,
72
+ "eval_runtime": 3.5184,
73
+ "eval_samples_per_second": 58.266,
74
+ "eval_steps_per_second": 1.99,
75
  "step": 58
76
  },
77
  {
78
  "epoch": 4.14,
79
  "learning_rate": 3.1746031746031745e-05,
80
+ "loss": 1.0171,
81
  "step": 60
82
  },
83
  {
84
  "epoch": 4.83,
85
  "learning_rate": 2.777777777777778e-05,
86
+ "loss": 0.9099,
87
  "step": 70
88
  },
89
  {
90
  "epoch": 4.97,
91
+ "eval_accuracy": 0.6,
92
+ "eval_loss": 0.9247760772705078,
93
+ "eval_runtime": 3.5711,
94
+ "eval_samples_per_second": 57.405,
95
+ "eval_steps_per_second": 1.96,
96
  "step": 72
97
  },
98
  {
99
  "epoch": 5.52,
100
  "learning_rate": 2.380952380952381e-05,
101
+ "loss": 0.8674,
102
  "step": 80
103
  },
104
  {
105
  "epoch": 6.0,
106
+ "eval_accuracy": 0.6780487804878049,
107
+ "eval_loss": 0.8766470551490784,
108
+ "eval_runtime": 3.5697,
109
+ "eval_samples_per_second": 57.428,
110
+ "eval_steps_per_second": 1.961,
111
  "step": 87
112
  },
113
  {
114
  "epoch": 6.21,
115
  "learning_rate": 1.984126984126984e-05,
116
+ "loss": 0.8807,
117
  "step": 90
118
  },
119
  {
120
  "epoch": 6.9,
121
  "learning_rate": 1.5873015873015872e-05,
122
+ "loss": 0.8638,
123
  "step": 100
124
  },
125
  {
126
  "epoch": 6.97,
127
+ "eval_accuracy": 0.6731707317073171,
128
+ "eval_loss": 0.865567684173584,
129
+ "eval_runtime": 3.828,
130
+ "eval_samples_per_second": 53.553,
131
+ "eval_steps_per_second": 1.829,
132
  "step": 101
133
  },
134
  {
135
  "epoch": 7.59,
136
  "learning_rate": 1.1904761904761905e-05,
137
+ "loss": 0.833,
138
  "step": 110
139
  },
140
  {
141
  "epoch": 8.0,
142
+ "eval_accuracy": 0.6731707317073171,
143
+ "eval_loss": 0.8395170569419861,
144
+ "eval_runtime": 3.5828,
145
+ "eval_samples_per_second": 57.218,
146
+ "eval_steps_per_second": 1.954,
147
  "step": 116
148
  },
149
  {
150
  "epoch": 8.28,
151
  "learning_rate": 7.936507936507936e-06,
152
+ "loss": 0.8396,
153
  "step": 120
154
  },
155
  {
156
  "epoch": 8.97,
157
  "learning_rate": 3.968253968253968e-06,
158
+ "loss": 0.8211,
159
  "step": 130
160
  },
161
  {
162
  "epoch": 8.97,
163
+ "eval_accuracy": 0.6926829268292682,
164
+ "eval_loss": 0.8203723430633545,
165
+ "eval_runtime": 3.633,
166
+ "eval_samples_per_second": 56.427,
167
+ "eval_steps_per_second": 1.927,
168
  "step": 130
169
  },
170
  {
171
  "epoch": 9.66,
172
  "learning_rate": 0.0,
173
+ "loss": 0.8236,
174
  "step": 140
175
  },
176
  {
177
  "epoch": 9.66,
178
+ "eval_accuracy": 0.6780487804878049,
179
+ "eval_loss": 0.8203750848770142,
180
+ "eval_runtime": 3.5738,
181
+ "eval_samples_per_second": 57.361,
182
+ "eval_steps_per_second": 1.959,
183
  "step": 140
184
  },
185
  {
186
  "epoch": 9.66,
187
  "step": 140,
188
  "total_flos": 5.78085766574506e+17,
189
+ "train_loss": 1.0145302023206437,
190
+ "train_runtime": 896.6945,
191
+ "train_samples_per_second": 20.509,
192
+ "train_steps_per_second": 0.156
193
  }
194
  ],
195
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78c8073d0ca296061eeb2c1f9efe2310da5f052d3bfc061bd3372b205f4693f1
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1577050422d312cadf11da4407c557f68886a726d97b4971bf7def3ccd26394
3
  size 4792