rshrott committed on
Commit
a5905b8
1 Parent(s): cdde9ee

🍻 cheers

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: ryan_model314_3
@@ -13,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # ryan_model314_3
15
 
16
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the None dataset.
17
  It achieves the following results on the evaluation set:
18
  - Loss: 0.2696
19
  - Na Accuracy: 0.96
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
5
+ - image-classification
6
  - generated_from_trainer
7
  model-index:
8
  - name: ryan_model314_3
 
14
 
15
  # ryan_model314_3
16
 
17
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the beans dataset.
18
  It achieves the following results on the evaluation set:
19
  - Loss: 0.2696
20
  - Na Accuracy: 0.96
all_results.json CHANGED
@@ -1,13 +1,14 @@
1
  {
2
- "epoch": 0.51,
3
- "eval_loss": 0.2651739716529846,
4
- "eval_na_accuracy": 0.9371701432520734,
5
- "eval_ordinal_mae": 1.021151511080242,
6
- "eval_runtime": 162.3376,
7
- "eval_samples_per_second": 24.511,
8
- "eval_steps_per_second": 3.068,
9
- "train_loss": 0.29898834055120294,
10
- "train_runtime": 4048.1416,
11
- "train_samples_per_second": 34.064,
12
- "train_steps_per_second": 2.129
 
13
  }
 
1
  {
2
+ "epoch": 2.0,
3
+ "eval_loss": 0.2696247398853302,
4
+ "eval_na_accuracy": 0.96,
5
+ "eval_ordinal_accuracy": 0.5,
6
+ "eval_ordinal_mae": 1.168388410445914,
7
+ "eval_runtime": 4.4189,
8
+ "eval_samples_per_second": 22.63,
9
+ "eval_steps_per_second": 2.942,
10
+ "train_loss": 0.3214722058129689,
11
+ "train_runtime": 262.7567,
12
+ "train_samples_per_second": 7.612,
13
+ "train_steps_per_second": 0.48
14
  }
eval_results.json CHANGED
@@ -1,9 +1,10 @@
1
  {
2
- "epoch": 0.51,
3
- "eval_loss": 0.2651739716529846,
4
- "eval_na_accuracy": 0.9371701432520734,
5
- "eval_ordinal_mae": 1.021151511080242,
6
- "eval_runtime": 162.3376,
7
- "eval_samples_per_second": 24.511,
8
- "eval_steps_per_second": 3.068
 
9
  }
 
1
  {
2
+ "epoch": 2.0,
3
+ "eval_loss": 0.2696247398853302,
4
+ "eval_na_accuracy": 0.96,
5
+ "eval_ordinal_accuracy": 0.5,
6
+ "eval_ordinal_mae": 1.168388410445914,
7
+ "eval_runtime": 4.4189,
8
+ "eval_samples_per_second": 22.63,
9
+ "eval_steps_per_second": 2.942
10
  }
runs/Mar27_07-38-15_ryanserver/events.out.tfevents.1711539836.ryanserver.4146.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f857d222c6c7045f0baeea737e138c33ca42010ed029a92f0da9178649dc6d9c
3
+ size 521
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 0.51,
3
- "train_loss": 0.29898834055120294,
4
- "train_runtime": 4048.1416,
5
- "train_samples_per_second": 34.064,
6
- "train_steps_per_second": 2.129
7
  }
 
1
  {
2
+ "epoch": 2.0,
3
+ "train_loss": 0.3214722058129689,
4
+ "train_runtime": 262.7567,
5
+ "train_samples_per_second": 7.612,
6
+ "train_steps_per_second": 0.48
7
  }
trainer_state.json CHANGED
@@ -1,216 +1,65 @@
1
  {
2
- "best_metric": 0.2651739716529846,
3
- "best_model_checkpoint": "./ryan_model314_3/checkpoint-1000",
4
- "epoch": 0.5104408352668214,
5
- "eval_steps": 100,
6
- "global_step": 1100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.05,
13
- "grad_norm": 1.358393669128418,
14
- "learning_rate": 0.00019767981438515082,
15
- "loss": 0.3676,
16
- "step": 100
17
- },
18
- {
19
- "epoch": 0.05,
20
- "eval_loss": 0.34232085943222046,
21
- "eval_na_accuracy": 0.9273686855993968,
22
- "eval_ordinal_mae": 1.1293019706063574,
23
- "eval_runtime": 381.3744,
24
- "eval_samples_per_second": 10.433,
25
- "eval_steps_per_second": 1.306,
26
- "step": 100
27
- },
28
- {
29
- "epoch": 0.09,
30
- "grad_norm": 0.9884235262870789,
31
- "learning_rate": 0.00019535962877030162,
32
- "loss": 0.3329,
33
- "step": 200
34
- },
35
- {
36
- "epoch": 0.09,
37
- "eval_loss": 0.31356191635131836,
38
- "eval_na_accuracy": 0.9313897964312642,
39
- "eval_ordinal_mae": 1.070580373245832,
40
- "eval_runtime": 164.3074,
41
- "eval_samples_per_second": 24.217,
42
- "eval_steps_per_second": 3.031,
43
- "step": 200
44
- },
45
- {
46
- "epoch": 0.14,
47
- "grad_norm": 1.2422517538070679,
48
- "learning_rate": 0.00019303944315545243,
49
- "loss": 0.3134,
50
- "step": 300
51
- },
52
- {
53
- "epoch": 0.14,
54
- "eval_loss": 0.3302006423473358,
55
- "eval_na_accuracy": 0.9165619502387534,
56
- "eval_ordinal_mae": 1.1219553900231423,
57
- "eval_runtime": 164.3869,
58
- "eval_samples_per_second": 24.205,
59
- "eval_steps_per_second": 3.029,
60
- "step": 300
61
- },
62
- {
63
- "epoch": 0.19,
64
- "grad_norm": 1.1815475225448608,
65
- "learning_rate": 0.00019071925754060324,
66
- "loss": 0.314,
67
- "step": 400
68
- },
69
- {
70
- "epoch": 0.19,
71
- "eval_loss": 0.2992381155490875,
72
- "eval_na_accuracy": 0.9256094496104549,
73
- "eval_ordinal_mae": 0.820222080006495,
74
- "eval_runtime": 165.1522,
75
- "eval_samples_per_second": 24.093,
76
- "eval_steps_per_second": 3.015,
77
- "step": 400
78
- },
79
- {
80
- "epoch": 0.23,
81
- "grad_norm": 0.47366032004356384,
82
- "learning_rate": 0.00018839907192575407,
83
- "loss": 0.2965,
84
- "step": 500
85
- },
86
- {
87
- "epoch": 0.23,
88
- "eval_loss": 0.319803923368454,
89
- "eval_na_accuracy": 0.9248554913294798,
90
- "eval_ordinal_mae": 1.2210362517446196,
91
- "eval_runtime": 163.23,
92
- "eval_samples_per_second": 24.377,
93
- "eval_steps_per_second": 3.051,
94
- "step": 500
95
  },
96
  {
97
- "epoch": 0.28,
98
- "grad_norm": 1.8707951307296753,
99
- "learning_rate": 0.00018607888631090488,
100
- "loss": 0.3068,
101
- "step": 600
 
 
 
 
102
  },
103
  {
104
- "epoch": 0.28,
105
- "eval_loss": 0.26730772852897644,
106
- "eval_na_accuracy": 0.9371701432520734,
107
- "eval_ordinal_mae": 1.103637127990878,
108
- "eval_runtime": 160.1368,
109
- "eval_samples_per_second": 24.848,
110
- "eval_steps_per_second": 3.11,
111
- "step": 600
112
- },
113
- {
114
- "epoch": 0.32,
115
- "grad_norm": 1.1020443439483643,
116
- "learning_rate": 0.0001837587006960557,
117
- "loss": 0.2824,
118
- "step": 700
119
- },
120
- {
121
- "epoch": 0.32,
122
- "eval_loss": 0.2921823561191559,
123
- "eval_na_accuracy": 0.9371701432520734,
124
- "eval_ordinal_mae": 1.4977284913306896,
125
- "eval_runtime": 163.7628,
126
- "eval_samples_per_second": 24.297,
127
- "eval_steps_per_second": 3.041,
128
- "step": 700
129
- },
130
- {
131
- "epoch": 0.37,
132
- "grad_norm": 1.2855117321014404,
133
- "learning_rate": 0.0001814385150812065,
134
- "loss": 0.2914,
135
- "step": 800
136
- },
137
- {
138
- "epoch": 0.37,
139
- "eval_loss": 0.2798122763633728,
140
- "eval_na_accuracy": 0.9384267403870319,
141
- "eval_ordinal_mae": 0.7788859930601368,
142
- "eval_runtime": 163.524,
143
- "eval_samples_per_second": 24.333,
144
- "eval_steps_per_second": 3.045,
145
- "step": 800
146
- },
147
- {
148
- "epoch": 0.42,
149
- "grad_norm": 1.4634666442871094,
150
- "learning_rate": 0.00017911832946635733,
151
- "loss": 0.2968,
152
- "step": 900
153
- },
154
- {
155
- "epoch": 0.42,
156
- "eval_loss": 0.27096793055534363,
157
- "eval_na_accuracy": 0.9369188238250816,
158
- "eval_ordinal_mae": 0.9694435305190251,
159
- "eval_runtime": 163.2761,
160
- "eval_samples_per_second": 24.37,
161
- "eval_steps_per_second": 3.05,
162
- "step": 900
163
- },
164
- {
165
- "epoch": 0.46,
166
- "grad_norm": 0.3547471761703491,
167
- "learning_rate": 0.00017679814385150814,
168
- "loss": 0.2433,
169
- "step": 1000
170
- },
171
- {
172
- "epoch": 0.46,
173
- "eval_loss": 0.2651739716529846,
174
- "eval_na_accuracy": 0.9371701432520734,
175
- "eval_ordinal_mae": 1.021151511080242,
176
- "eval_runtime": 165.2163,
177
- "eval_samples_per_second": 24.084,
178
- "eval_steps_per_second": 3.014,
179
- "step": 1000
180
- },
181
- {
182
- "epoch": 0.51,
183
- "grad_norm": 0.6242479085922241,
184
- "learning_rate": 0.00017447795823665894,
185
- "loss": 0.2438,
186
- "step": 1100
187
  },
188
  {
189
- "epoch": 0.51,
190
- "eval_loss": 0.2782880365848541,
191
- "eval_na_accuracy": 0.9389293792410154,
192
- "eval_ordinal_mae": 0.8154305260353155,
193
- "eval_runtime": 161.9425,
194
- "eval_samples_per_second": 24.57,
195
- "eval_steps_per_second": 3.075,
196
- "step": 1100
 
197
  },
198
  {
199
- "epoch": 0.51,
200
- "step": 1100,
201
- "total_flos": 1.363907912564736e+18,
202
- "train_loss": 0.29898834055120294,
203
- "train_runtime": 4048.1416,
204
- "train_samples_per_second": 34.064,
205
- "train_steps_per_second": 2.129
206
  }
207
  ],
208
- "logging_steps": 100,
209
- "max_steps": 8620,
210
  "num_input_tokens_seen": 0,
211
- "num_train_epochs": 4,
212
- "save_steps": 100,
213
- "total_flos": 1.363907912564736e+18,
214
  "train_batch_size": 16,
215
  "trial_name": null,
216
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.2696247398853302,
3
+ "best_model_checkpoint": "./ryan_model314_3/checkpoint-100",
4
+ "epoch": 2.0,
5
+ "eval_steps": 50,
6
+ "global_step": 126,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.79,
13
+ "grad_norm": 0.766051709651947,
14
+ "learning_rate": 0.00012063492063492063,
15
+ "loss": 0.4088,
16
+ "step": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  },
18
  {
19
+ "epoch": 0.79,
20
+ "eval_loss": 0.30989590287208557,
21
+ "eval_na_accuracy": 0.93,
22
+ "eval_ordinal_accuracy": 0.43478260869565216,
23
+ "eval_ordinal_mae": 1.1052913616381967,
24
+ "eval_runtime": 14.2973,
25
+ "eval_samples_per_second": 6.994,
26
+ "eval_steps_per_second": 0.909,
27
+ "step": 50
28
  },
29
  {
30
+ "epoch": 1.59,
31
+ "grad_norm": 0.8156992793083191,
32
+ "learning_rate": 4.126984126984127e-05,
33
+ "loss": 0.2813,
34
+ "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  },
36
  {
37
+ "epoch": 1.59,
38
+ "eval_loss": 0.2696247398853302,
39
+ "eval_na_accuracy": 0.96,
40
+ "eval_ordinal_accuracy": 0.5,
41
+ "eval_ordinal_mae": 1.168388410445914,
42
+ "eval_runtime": 4.0273,
43
+ "eval_samples_per_second": 24.831,
44
+ "eval_steps_per_second": 3.228,
45
+ "step": 100
46
  },
47
  {
48
+ "epoch": 2.0,
49
+ "step": 126,
50
+ "total_flos": 1.5498953551872e+17,
51
+ "train_loss": 0.3214722058129689,
52
+ "train_runtime": 262.7567,
53
+ "train_samples_per_second": 7.612,
54
+ "train_steps_per_second": 0.48
55
  }
56
  ],
57
+ "logging_steps": 50,
58
+ "max_steps": 126,
59
  "num_input_tokens_seen": 0,
60
+ "num_train_epochs": 2,
61
+ "save_steps": 50,
62
+ "total_flos": 1.5498953551872e+17,
63
  "train_batch_size": 16,
64
  "trial_name": null,
65
  "trial_params": null