rshrott committed on
Commit
ff9cd40
1 Parent(s): 9f9f939

🍻 cheers

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: ryan_model314_3
@@ -13,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # ryan_model314_3
15
 
16
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
  - Loss: 0.2750
19
  - Na Accuracy: 0.931
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
5
+ - image-classification
6
  - generated_from_trainer
7
  model-index:
8
  - name: ryan_model314_3
 
14
 
15
  # ryan_model314_3
16
 
17
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the beans dataset.
18
  It achieves the following results on the evaluation set:
19
  - Loss: 0.2750
20
  - Na Accuracy: 0.931
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_loss": 0.2744598984718323,
4
- "eval_na_accuracy": 0.96,
5
- "eval_ordinal_accuracy": 0.5108695652173914,
6
- "eval_ordinal_mae": 0.5806456123182611,
7
- "eval_runtime": 4.777,
8
- "eval_samples_per_second": 20.934,
9
- "eval_steps_per_second": 2.721,
10
- "train_loss": 0.32528334193759495,
11
- "train_runtime": 229.1686,
12
- "train_samples_per_second": 8.727,
13
- "train_steps_per_second": 0.55
14
  }
 
1
  {
2
+ "epoch": 0.88,
3
+ "eval_loss": 0.2750368118286133,
4
+ "eval_na_accuracy": 0.931,
5
+ "eval_ordinal_accuracy": 0.6271379703534777,
6
+ "eval_ordinal_mae": 0.5319093595330124,
7
+ "eval_runtime": 42.4663,
8
+ "eval_samples_per_second": 23.548,
9
+ "eval_steps_per_second": 2.944,
10
+ "train_loss": 0.3000895881652832,
11
+ "train_runtime": 2172.3633,
12
+ "train_samples_per_second": 9.207,
13
+ "train_steps_per_second": 0.575
14
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_loss": 0.2744598984718323,
4
- "eval_na_accuracy": 0.96,
5
- "eval_ordinal_accuracy": 0.5108695652173914,
6
- "eval_ordinal_mae": 0.5806456123182611,
7
- "eval_runtime": 4.777,
8
- "eval_samples_per_second": 20.934,
9
- "eval_steps_per_second": 2.721
10
  }
 
1
  {
2
+ "epoch": 0.88,
3
+ "eval_loss": 0.2750368118286133,
4
+ "eval_na_accuracy": 0.931,
5
+ "eval_ordinal_accuracy": 0.6271379703534777,
6
+ "eval_ordinal_mae": 0.5319093595330124,
7
+ "eval_runtime": 42.4663,
8
+ "eval_samples_per_second": 23.548,
9
+ "eval_steps_per_second": 2.944
10
  }
runs/Mar27_08-05-10_ryanserver/events.out.tfevents.1711543379.ryanserver.8800.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a0cebfd799724c7fc5edf6d1e013bdec3501d228ae92a969b732af9bb19da0e
3
+ size 529
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 2.0,
3
- "train_loss": 0.32528334193759495,
4
- "train_runtime": 229.1686,
5
- "train_samples_per_second": 8.727,
6
- "train_steps_per_second": 0.55
7
  }
 
1
  {
2
+ "epoch": 0.88,
3
+ "train_loss": 0.3000895881652832,
4
+ "train_runtime": 2172.3633,
5
+ "train_samples_per_second": 9.207,
6
+ "train_steps_per_second": 0.575
7
  }
trainer_state.json CHANGED
@@ -1,65 +1,227 @@
1
  {
2
- "best_metric": 0.2744598984718323,
3
- "best_model_checkpoint": "./ryan_model314_3/checkpoint-100",
4
- "epoch": 2.0,
5
  "eval_steps": 50,
6
- "global_step": 126,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.79,
13
- "grad_norm": 0.808198094367981,
14
- "learning_rate": 0.00012063492063492063,
15
- "loss": 0.4094,
16
  "step": 50
17
  },
18
  {
19
- "epoch": 0.79,
20
- "eval_loss": 0.31280139088630676,
21
- "eval_na_accuracy": 0.94,
22
- "eval_ordinal_accuracy": 0.40217391304347827,
23
- "eval_ordinal_mae": 0.6332903986837229,
24
- "eval_runtime": 11.6495,
25
- "eval_samples_per_second": 8.584,
26
- "eval_steps_per_second": 1.116,
27
  "step": 50
28
  },
29
  {
30
- "epoch": 1.59,
31
- "grad_norm": 0.8316417336463928,
32
- "learning_rate": 4.126984126984127e-05,
33
- "loss": 0.29,
34
  "step": 100
35
  },
36
  {
37
- "epoch": 1.59,
38
- "eval_loss": 0.2744598984718323,
39
- "eval_na_accuracy": 0.96,
40
- "eval_ordinal_accuracy": 0.5108695652173914,
41
- "eval_ordinal_mae": 0.5806456123182611,
42
- "eval_runtime": 4.1502,
43
- "eval_samples_per_second": 24.095,
44
- "eval_steps_per_second": 3.132,
45
  "step": 100
46
  },
47
  {
48
- "epoch": 2.0,
49
- "step": 126,
50
- "total_flos": 1.5498953551872e+17,
51
- "train_loss": 0.32528334193759495,
52
- "train_runtime": 229.1686,
53
- "train_samples_per_second": 8.727,
54
- "train_steps_per_second": 0.55
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  }
56
  ],
57
  "logging_steps": 50,
58
- "max_steps": 126,
59
  "num_input_tokens_seen": 0,
60
  "num_train_epochs": 2,
61
  "save_steps": 50,
62
- "total_flos": 1.5498953551872e+17,
63
  "train_batch_size": 16,
64
  "trial_name": null,
65
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.2750368118286133,
3
+ "best_model_checkpoint": "./ryan_model314_3/checkpoint-550",
4
+ "epoch": 0.88,
5
  "eval_steps": 50,
6
+ "global_step": 550,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.08,
13
+ "grad_norm": 1.5017586946487427,
14
+ "learning_rate": 0.000192,
15
+ "loss": 0.4423,
16
  "step": 50
17
  },
18
  {
19
+ "epoch": 0.08,
20
+ "eval_loss": 0.33861014246940613,
21
+ "eval_na_accuracy": 0.904,
22
+ "eval_ordinal_accuracy": 0.4629418472063854,
23
+ "eval_ordinal_mae": 0.6577621472191316,
24
+ "eval_runtime": 123.3898,
25
+ "eval_samples_per_second": 8.104,
26
+ "eval_steps_per_second": 1.013,
27
  "step": 50
28
  },
29
  {
30
+ "epoch": 0.16,
31
+ "grad_norm": 0.8501819372177124,
32
+ "learning_rate": 0.00018400000000000003,
33
+ "loss": 0.3088,
34
  "step": 100
35
  },
36
  {
37
+ "epoch": 0.16,
38
+ "eval_loss": 0.3268783390522003,
39
+ "eval_na_accuracy": 0.928,
40
+ "eval_ordinal_accuracy": 0.5370581527936146,
41
+ "eval_ordinal_mae": 0.5969413880658287,
42
+ "eval_runtime": 43.4997,
43
+ "eval_samples_per_second": 22.989,
44
+ "eval_steps_per_second": 2.874,
45
  "step": 100
46
  },
47
  {
48
+ "epoch": 0.24,
49
+ "grad_norm": 0.5424334406852722,
50
+ "learning_rate": 0.00017600000000000002,
51
+ "loss": 0.316,
52
+ "step": 150
53
+ },
54
+ {
55
+ "epoch": 0.24,
56
+ "eval_loss": 0.3395713269710541,
57
+ "eval_na_accuracy": 0.902,
58
+ "eval_ordinal_accuracy": 0.5142531356898518,
59
+ "eval_ordinal_mae": 0.6323422620227872,
60
+ "eval_runtime": 43.339,
61
+ "eval_samples_per_second": 23.074,
62
+ "eval_steps_per_second": 2.884,
63
+ "step": 150
64
+ },
65
+ {
66
+ "epoch": 0.32,
67
+ "grad_norm": 1.2484453916549683,
68
+ "learning_rate": 0.000168,
69
+ "loss": 0.2821,
70
+ "step": 200
71
+ },
72
+ {
73
+ "epoch": 0.32,
74
+ "eval_loss": 0.32339948415756226,
75
+ "eval_na_accuracy": 0.927,
76
+ "eval_ordinal_accuracy": 0.5131128848346637,
77
+ "eval_ordinal_mae": 0.6292874569299393,
78
+ "eval_runtime": 42.0004,
79
+ "eval_samples_per_second": 23.809,
80
+ "eval_steps_per_second": 2.976,
81
+ "step": 200
82
+ },
83
+ {
84
+ "epoch": 0.4,
85
+ "grad_norm": 1.4807660579681396,
86
+ "learning_rate": 0.00016,
87
+ "loss": 0.2731,
88
+ "step": 250
89
+ },
90
+ {
91
+ "epoch": 0.4,
92
+ "eval_loss": 0.3313509225845337,
93
+ "eval_na_accuracy": 0.925,
94
+ "eval_ordinal_accuracy": 0.508551881413911,
95
+ "eval_ordinal_mae": 0.5856009521101041,
96
+ "eval_runtime": 55.6564,
97
+ "eval_samples_per_second": 17.967,
98
+ "eval_steps_per_second": 2.246,
99
+ "step": 250
100
+ },
101
+ {
102
+ "epoch": 0.48,
103
+ "grad_norm": 1.4179209470748901,
104
+ "learning_rate": 0.000152,
105
+ "loss": 0.2975,
106
+ "step": 300
107
+ },
108
+ {
109
+ "epoch": 0.48,
110
+ "eval_loss": 0.3036611080169678,
111
+ "eval_na_accuracy": 0.927,
112
+ "eval_ordinal_accuracy": 0.5963511972633979,
113
+ "eval_ordinal_mae": 0.5690023564742932,
114
+ "eval_runtime": 42.7034,
115
+ "eval_samples_per_second": 23.417,
116
+ "eval_steps_per_second": 2.927,
117
+ "step": 300
118
+ },
119
+ {
120
+ "epoch": 0.56,
121
+ "grad_norm": 0.7659221887588501,
122
+ "learning_rate": 0.000144,
123
+ "loss": 0.2609,
124
+ "step": 350
125
+ },
126
+ {
127
+ "epoch": 0.56,
128
+ "eval_loss": 0.3209022283554077,
129
+ "eval_na_accuracy": 0.928,
130
+ "eval_ordinal_accuracy": 0.5450399087799316,
131
+ "eval_ordinal_mae": 0.5764862077817825,
132
+ "eval_runtime": 43.1206,
133
+ "eval_samples_per_second": 23.191,
134
+ "eval_steps_per_second": 2.899,
135
+ "step": 350
136
+ },
137
+ {
138
+ "epoch": 0.64,
139
+ "grad_norm": 1.0847711563110352,
140
+ "learning_rate": 0.00013600000000000003,
141
+ "loss": 0.287,
142
+ "step": 400
143
+ },
144
+ {
145
+ "epoch": 0.64,
146
+ "eval_loss": 0.29075464606285095,
147
+ "eval_na_accuracy": 0.931,
148
+ "eval_ordinal_accuracy": 0.5826681870011402,
149
+ "eval_ordinal_mae": 0.5458187616535902,
150
+ "eval_runtime": 42.3269,
151
+ "eval_samples_per_second": 23.626,
152
+ "eval_steps_per_second": 2.953,
153
+ "step": 400
154
+ },
155
+ {
156
+ "epoch": 0.72,
157
+ "grad_norm": 0.9720218181610107,
158
+ "learning_rate": 0.00012800000000000002,
159
+ "loss": 0.2905,
160
+ "step": 450
161
+ },
162
+ {
163
+ "epoch": 0.72,
164
+ "eval_loss": 0.30074238777160645,
165
+ "eval_na_accuracy": 0.919,
166
+ "eval_ordinal_accuracy": 0.5986316989737742,
167
+ "eval_ordinal_mae": 0.548372159519042,
168
+ "eval_runtime": 76.7524,
169
+ "eval_samples_per_second": 13.029,
170
+ "eval_steps_per_second": 1.629,
171
+ "step": 450
172
+ },
173
+ {
174
+ "epoch": 0.8,
175
+ "grad_norm": 0.8414099216461182,
176
+ "learning_rate": 0.00012,
177
+ "loss": 0.2574,
178
+ "step": 500
179
+ },
180
+ {
181
+ "epoch": 0.8,
182
+ "eval_loss": 0.28344637155532837,
183
+ "eval_na_accuracy": 0.929,
184
+ "eval_ordinal_accuracy": 0.6031927023945268,
185
+ "eval_ordinal_mae": 0.5363022306512,
186
+ "eval_runtime": 42.8484,
187
+ "eval_samples_per_second": 23.338,
188
+ "eval_steps_per_second": 2.917,
189
+ "step": 500
190
+ },
191
+ {
192
+ "epoch": 0.88,
193
+ "grad_norm": 0.5895617604255676,
194
+ "learning_rate": 0.00011200000000000001,
195
+ "loss": 0.2855,
196
+ "step": 550
197
+ },
198
+ {
199
+ "epoch": 0.88,
200
+ "eval_loss": 0.2750368118286133,
201
+ "eval_na_accuracy": 0.931,
202
+ "eval_ordinal_accuracy": 0.6271379703534777,
203
+ "eval_ordinal_mae": 0.5319093595330124,
204
+ "eval_runtime": 42.3171,
205
+ "eval_samples_per_second": 23.631,
206
+ "eval_steps_per_second": 2.954,
207
+ "step": 550
208
+ },
209
+ {
210
+ "epoch": 0.88,
211
+ "step": 550,
212
+ "total_flos": 6.81953956282368e+17,
213
+ "train_loss": 0.3000895881652832,
214
+ "train_runtime": 2172.3633,
215
+ "train_samples_per_second": 9.207,
216
+ "train_steps_per_second": 0.575
217
  }
218
  ],
219
  "logging_steps": 50,
220
+ "max_steps": 1250,
221
  "num_input_tokens_seen": 0,
222
  "num_train_epochs": 2,
223
  "save_steps": 50,
224
+ "total_flos": 6.81953956282368e+17,
225
  "train_batch_size": 16,
226
  "trial_name": null,
227
  "trial_params": null