AnneMarie1 commited on
Commit
9d4ef70
1 Parent(s): 044e80e

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
- "epoch": 2.95,
3
- "total_flos": 1.4272188589307658e+18,
4
- "train_loss": 0.7287208272351159,
5
- "train_runtime": 993.4233,
6
- "train_samples_per_second": 18.817,
7
- "train_steps_per_second": 0.145
 
 
 
 
 
8
  }
 
1
  {
2
+ "epoch": 4.92,
3
+ "eval_accuracy": 0.9845857418111753,
4
+ "eval_loss": 0.07430984824895859,
5
+ "eval_runtime": 60.6008,
6
+ "eval_samples_per_second": 51.385,
7
+ "eval_steps_per_second": 1.617,
8
+ "total_flos": 2.378233054601478e+18,
9
+ "train_loss": 0.6406697725256284,
10
+ "train_runtime": 1704.9827,
11
+ "train_samples_per_second": 18.273,
12
+ "train_steps_per_second": 0.141
13
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.92,
3
+ "eval_accuracy": 0.9845857418111753,
4
+ "eval_loss": 0.07430984824895859,
5
+ "eval_runtime": 60.6008,
6
+ "eval_samples_per_second": 51.385,
7
+ "eval_steps_per_second": 1.617
8
+ }
runs/Mar29_15-56-05_f7c26454068d/events.out.tfevents.1680107179.f7c26454068d.1677.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:009275fe92ccff7d88487c22e47bf27cb3989f7a6624a64017d55e70dce3b947
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.95,
3
- "total_flos": 1.4272188589307658e+18,
4
- "train_loss": 0.7287208272351159,
5
- "train_runtime": 993.4233,
6
- "train_samples_per_second": 18.817,
7
- "train_steps_per_second": 0.145
8
  }
 
1
  {
2
+ "epoch": 4.92,
3
+ "total_flos": 2.378233054601478e+18,
4
+ "train_loss": 0.6406697725256284,
5
+ "train_runtime": 1704.9827,
6
+ "train_samples_per_second": 18.273,
7
+ "train_steps_per_second": 0.141
8
  }
trainer_state.json CHANGED
@@ -1,136 +1,214 @@
1
  {
2
- "best_metric": 0.9605009633911368,
3
- "best_model_checkpoint": "clip-vit-large-patch14-finetuned-fruits-360_vitlarge/checkpoint-144",
4
- "epoch": 2.953846153846154,
5
- "global_step": 144,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.21,
12
- "learning_rate": 3.3333333333333335e-05,
13
- "loss": 1.991,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.41,
18
- "learning_rate": 4.8062015503875976e-05,
19
- "loss": 1.4175,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.62,
24
- "learning_rate": 4.418604651162791e-05,
25
- "loss": 1.0701,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.82,
30
- "learning_rate": 4.0310077519379843e-05,
31
- "loss": 0.8631,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.98,
36
- "eval_accuracy": 0.852922286448298,
37
- "eval_loss": 0.4619566798210144,
38
- "eval_runtime": 62.7979,
39
- "eval_samples_per_second": 49.588,
40
- "eval_steps_per_second": 1.561,
41
  "step": 48
42
  },
43
  {
44
  "epoch": 1.03,
45
- "learning_rate": 3.6434108527131784e-05,
46
- "loss": 0.6585,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.23,
51
- "learning_rate": 3.2558139534883724e-05,
52
- "loss": 0.6017,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.44,
57
- "learning_rate": 2.868217054263566e-05,
58
- "loss": 0.6272,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.64,
63
- "learning_rate": 2.48062015503876e-05,
64
- "loss": 0.6237,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 1.85,
69
- "learning_rate": 2.0930232558139536e-05,
70
- "loss": 0.485,
71
  "step": 90
72
  },
73
  {
74
  "epoch": 1.99,
75
- "eval_accuracy": 0.9100834938985228,
76
- "eval_loss": 0.2783240079879761,
77
- "eval_runtime": 62.6573,
78
- "eval_samples_per_second": 49.699,
79
- "eval_steps_per_second": 1.564,
80
  "step": 97
81
  },
82
  {
83
  "epoch": 2.05,
84
- "learning_rate": 1.7054263565891473e-05,
85
- "loss": 0.4887,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.26,
90
- "learning_rate": 1.3178294573643413e-05,
91
- "loss": 0.44,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.46,
96
- "learning_rate": 9.302325581395349e-06,
97
- "loss": 0.4065,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 2.67,
102
- "learning_rate": 5.426356589147287e-06,
103
- "loss": 0.3612,
104
  "step": 130
105
  },
106
  {
107
  "epoch": 2.87,
108
- "learning_rate": 1.550387596899225e-06,
109
- "loss": 0.3246,
110
  "step": 140
111
  },
112
  {
113
- "epoch": 2.95,
114
- "eval_accuracy": 0.9605009633911368,
115
- "eval_loss": 0.17322921752929688,
116
- "eval_runtime": 62.2033,
117
- "eval_samples_per_second": 50.062,
118
- "eval_steps_per_second": 1.575,
119
- "step": 144
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
120
  },
121
  {
122
- "epoch": 2.95,
123
- "step": 144,
124
- "total_flos": 1.4272188589307658e+18,
125
- "train_loss": 0.7287208272351159,
126
- "train_runtime": 993.4233,
127
- "train_samples_per_second": 18.817,
128
- "train_steps_per_second": 0.145
129
  }
130
  ],
131
- "max_steps": 144,
132
- "num_train_epochs": 3,
133
- "total_flos": 1.4272188589307658e+18,
134
  "trial_name": null,
135
  "trial_params": null
136
  }
 
1
  {
2
+ "best_metric": 0.9845857418111753,
3
+ "best_model_checkpoint": "clip-vit-large-patch14-finetuned-fruits-360_vitlarge/checkpoint-240",
4
+ "epoch": 4.923076923076923,
5
+ "global_step": 240,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.21,
12
+ "learning_rate": 2.0833333333333336e-05,
13
+ "loss": 2.7421,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.41,
18
+ "learning_rate": 4.166666666666667e-05,
19
+ "loss": 1.7164,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.62,
24
+ "learning_rate": 4.8611111111111115e-05,
25
+ "loss": 1.3248,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.82,
30
+ "learning_rate": 4.62962962962963e-05,
31
+ "loss": 1.0674,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.98,
36
+ "eval_accuracy": 0.7475915221579962,
37
+ "eval_loss": 0.6957976222038269,
38
+ "eval_runtime": 62.2188,
39
+ "eval_samples_per_second": 50.049,
40
+ "eval_steps_per_second": 1.575,
41
  "step": 48
42
  },
43
  {
44
  "epoch": 1.03,
45
+ "learning_rate": 4.3981481481481486e-05,
46
+ "loss": 0.8297,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.23,
51
+ "learning_rate": 4.166666666666667e-05,
52
+ "loss": 0.718,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.44,
57
+ "learning_rate": 3.935185185185186e-05,
58
+ "loss": 0.7231,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.64,
63
+ "learning_rate": 3.7037037037037037e-05,
64
+ "loss": 0.6447,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 1.85,
69
+ "learning_rate": 3.472222222222222e-05,
70
+ "loss": 0.5475,
71
  "step": 90
72
  },
73
  {
74
  "epoch": 1.99,
75
+ "eval_accuracy": 0.8542068079640334,
76
+ "eval_loss": 0.44836971163749695,
77
+ "eval_runtime": 64.139,
78
+ "eval_samples_per_second": 48.551,
79
+ "eval_steps_per_second": 1.528,
80
  "step": 97
81
  },
82
  {
83
  "epoch": 2.05,
84
+ "learning_rate": 3.240740740740741e-05,
85
+ "loss": 0.6017,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.26,
90
+ "learning_rate": 3.0092592592592593e-05,
91
+ "loss": 0.5081,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.46,
96
+ "learning_rate": 2.777777777777778e-05,
97
+ "loss": 0.4969,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 2.67,
102
+ "learning_rate": 2.5462962962962965e-05,
103
+ "loss": 0.4153,
104
  "step": 130
105
  },
106
  {
107
  "epoch": 2.87,
108
+ "learning_rate": 2.314814814814815e-05,
109
+ "loss": 0.4065,
110
  "step": 140
111
  },
112
  {
113
+ "epoch": 2.99,
114
+ "eval_accuracy": 0.9274245343609505,
115
+ "eval_loss": 0.22493986785411835,
116
+ "eval_runtime": 63.0661,
117
+ "eval_samples_per_second": 49.377,
118
+ "eval_steps_per_second": 1.554,
119
+ "step": 146
120
+ },
121
+ {
122
+ "epoch": 3.08,
123
+ "learning_rate": 2.0833333333333336e-05,
124
+ "loss": 0.3714,
125
+ "step": 150
126
+ },
127
+ {
128
+ "epoch": 3.28,
129
+ "learning_rate": 1.8518518518518518e-05,
130
+ "loss": 0.3319,
131
+ "step": 160
132
+ },
133
+ {
134
+ "epoch": 3.49,
135
+ "learning_rate": 1.6203703703703704e-05,
136
+ "loss": 0.3135,
137
+ "step": 170
138
+ },
139
+ {
140
+ "epoch": 3.69,
141
+ "learning_rate": 1.388888888888889e-05,
142
+ "loss": 0.2645,
143
+ "step": 180
144
+ },
145
+ {
146
+ "epoch": 3.9,
147
+ "learning_rate": 1.1574074074074075e-05,
148
+ "loss": 0.2386,
149
+ "step": 190
150
+ },
151
+ {
152
+ "epoch": 4.0,
153
+ "eval_accuracy": 0.9723827874116892,
154
+ "eval_loss": 0.11541179567575455,
155
+ "eval_runtime": 63.0456,
156
+ "eval_samples_per_second": 49.393,
157
+ "eval_steps_per_second": 1.554,
158
+ "step": 195
159
+ },
160
+ {
161
+ "epoch": 4.1,
162
+ "learning_rate": 9.259259259259259e-06,
163
+ "loss": 0.2559,
164
+ "step": 200
165
+ },
166
+ {
167
+ "epoch": 4.31,
168
+ "learning_rate": 6.944444444444445e-06,
169
+ "loss": 0.2543,
170
+ "step": 210
171
+ },
172
+ {
173
+ "epoch": 4.51,
174
+ "learning_rate": 4.6296296296296296e-06,
175
+ "loss": 0.2274,
176
+ "step": 220
177
+ },
178
+ {
179
+ "epoch": 4.72,
180
+ "learning_rate": 2.3148148148148148e-06,
181
+ "loss": 0.1793,
182
+ "step": 230
183
+ },
184
+ {
185
+ "epoch": 4.92,
186
+ "learning_rate": 0.0,
187
+ "loss": 0.197,
188
+ "step": 240
189
+ },
190
+ {
191
+ "epoch": 4.92,
192
+ "eval_accuracy": 0.9845857418111753,
193
+ "eval_loss": 0.07430984824895859,
194
+ "eval_runtime": 62.3565,
195
+ "eval_samples_per_second": 49.939,
196
+ "eval_steps_per_second": 1.572,
197
+ "step": 240
198
  },
199
  {
200
+ "epoch": 4.92,
201
+ "step": 240,
202
+ "total_flos": 2.378233054601478e+18,
203
+ "train_loss": 0.6406697725256284,
204
+ "train_runtime": 1704.9827,
205
+ "train_samples_per_second": 18.273,
206
+ "train_steps_per_second": 0.141
207
  }
208
  ],
209
+ "max_steps": 240,
210
+ "num_train_epochs": 5,
211
+ "total_flos": 2.378233054601478e+18,
212
  "trial_name": null,
213
  "trial_params": null
214
  }