Woleek committed on
Commit
ef4491d
1 Parent(s): d079a12

Training in progress, step 100

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 0.8095238095238095,
4
- "eval_loss": 0.5754128098487854,
5
- "eval_runtime": 1.4452,
6
- "eval_samples_per_second": 14.531,
7
- "eval_steps_per_second": 2.076,
8
- "train_loss": 0.10162481290883281,
9
- "train_runtime": 67.7444,
10
- "train_samples_per_second": 10.333,
11
- "train_steps_per_second": 2.657
12
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 0.8181818181818182,
4
+ "eval_loss": 0.7126299142837524,
5
+ "eval_runtime": 1.7324,
6
+ "eval_samples_per_second": 19.048,
7
+ "eval_steps_per_second": 2.886,
8
+ "train_loss": 0.1071862239856273,
9
+ "train_runtime": 140.5527,
10
+ "train_samples_per_second": 7.826,
11
+ "train_steps_per_second": 1.992
12
  }
config.json CHANGED
@@ -11,15 +11,16 @@
11
  "id2label": {
12
  "0": "airport",
13
  "1": "bathroom",
14
- "10": "zoo",
 
15
  "2": "beach",
16
  "3": "building_site",
17
  "4": "factory",
18
- "5": "house",
19
- "6": "office",
20
- "7": "road",
21
- "8": "skatepart",
22
- "9": "warehouse"
23
  },
24
  "image_size": 224,
25
  "initializer_range": 0.02,
@@ -30,12 +31,13 @@
30
  "beach": "2",
31
  "building_site": "3",
32
  "factory": "4",
33
- "house": "5",
34
- "office": "6",
35
- "road": "7",
36
- "skatepart": "8",
37
- "warehouse": "9",
38
- "zoo": "10"
 
39
  },
40
  "layer_norm_eps": 1e-12,
41
  "model_type": "vit",
 
11
  "id2label": {
12
  "0": "airport",
13
  "1": "bathroom",
14
+ "10": "warehouse",
15
+ "11": "zoo",
16
  "2": "beach",
17
  "3": "building_site",
18
  "4": "factory",
19
+ "5": "food",
20
+ "6": "house",
21
+ "7": "office",
22
+ "8": "road",
23
+ "9": "skatepart"
24
  },
25
  "image_size": 224,
26
  "initializer_range": 0.02,
 
31
  "beach": "2",
32
  "building_site": "3",
33
  "factory": "4",
34
+ "food": "5",
35
+ "house": "6",
36
+ "office": "7",
37
+ "road": "8",
38
+ "skatepart": "9",
39
+ "warehouse": "10",
40
+ "zoo": "11"
41
  },
42
  "layer_norm_eps": 1e-12,
43
  "model_type": "vit",
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
- "eval_accuracy": 0.8095238095238095,
4
- "eval_loss": 0.5754128098487854,
5
- "eval_runtime": 1.4452,
6
- "eval_samples_per_second": 14.531,
7
- "eval_steps_per_second": 2.076
8
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "eval_accuracy": 0.8181818181818182,
4
+ "eval_loss": 0.7126299142837524,
5
+ "eval_runtime": 1.7324,
6
+ "eval_samples_per_second": 19.048,
7
+ "eval_steps_per_second": 2.886
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecf973856cc57db14758c3df45c75f913734fc524dbe970bde54e425009b7607
3
- size 343296365
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb7d6d4cc205243a7dd46e5aa1ed9c3eaf175f23b42b9b901fa82aec81c63dfd
3
+ size 343299437
runs/Aug24_10-33-53_surveily-ag-02/events.out.tfevents.1692866292.surveily-ag-02.15198.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd5cd4baca8bae7d76a8e6466d15637a557fcda9a7810bdb6cb232cc1adc3a50
3
+ size 411
runs/Aug24_12-31-14_surveily-ag-02/events.out.tfevents.1692873080.surveily-ag-02.7570.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dd0ba1524f351192fc1468005337fb5398628b521c7f8b603edd34a97a9ea92
3
+ size 6602
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 20.0,
3
- "train_loss": 0.10162481290883281,
4
- "train_runtime": 67.7444,
5
- "train_samples_per_second": 10.333,
6
- "train_steps_per_second": 2.657
7
  }
 
1
  {
2
  "epoch": 20.0,
3
+ "train_loss": 0.1071862239856273,
4
+ "train_runtime": 140.5527,
5
+ "train_samples_per_second": 7.826,
6
+ "train_steps_per_second": 1.992
7
  }
trainer_state.json CHANGED
@@ -1,142 +1,238 @@
1
  {
2
- "best_metric": 0.5754128098487854,
3
- "best_model_checkpoint": "./vit-base/checkpoint-100",
4
  "epoch": 20.0,
5
- "global_step": 180,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 1.11,
12
- "learning_rate": 0.00018888888888888888,
13
- "loss": 1.5669,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 2.22,
18
- "learning_rate": 0.00017777777777777779,
19
- "loss": 0.2294,
20
  "step": 20
21
  },
22
  {
23
- "epoch": 3.33,
24
- "learning_rate": 0.0001666666666666667,
25
- "loss": 0.0267,
26
  "step": 30
27
  },
28
  {
29
- "epoch": 4.44,
30
- "learning_rate": 0.00015555555555555556,
31
- "loss": 0.002,
32
  "step": 40
33
  },
34
  {
35
- "epoch": 5.56,
36
- "learning_rate": 0.00014444444444444444,
37
- "loss": 0.0008,
38
  "step": 50
39
  },
40
  {
41
- "epoch": 6.67,
42
- "learning_rate": 0.00013333333333333334,
43
- "loss": 0.0005,
 
 
 
 
 
 
 
 
 
44
  "step": 60
45
  },
46
  {
47
- "epoch": 7.78,
48
- "learning_rate": 0.00012222222222222224,
49
- "loss": 0.0004,
50
  "step": 70
51
  },
52
  {
53
- "epoch": 8.89,
54
- "learning_rate": 0.00011111111111111112,
55
- "loss": 0.0003,
56
  "step": 80
57
  },
58
  {
59
- "epoch": 10.0,
60
- "learning_rate": 0.0001,
61
- "loss": 0.0003,
62
  "step": 90
63
  },
64
  {
65
- "epoch": 11.11,
66
- "learning_rate": 8.888888888888889e-05,
67
- "loss": 0.0003,
68
  "step": 100
69
  },
70
  {
71
- "epoch": 11.11,
72
- "eval_accuracy": 0.8095238095238095,
73
- "eval_loss": 0.5754128098487854,
74
- "eval_runtime": 1.0617,
75
- "eval_samples_per_second": 19.78,
76
- "eval_steps_per_second": 2.826,
77
  "step": 100
78
  },
79
  {
80
- "epoch": 12.22,
81
- "learning_rate": 7.777777777777778e-05,
82
- "loss": 0.0002,
83
  "step": 110
84
  },
85
  {
86
- "epoch": 13.33,
87
- "learning_rate": 6.666666666666667e-05,
88
- "loss": 0.0002,
89
  "step": 120
90
  },
91
  {
92
- "epoch": 14.44,
93
- "learning_rate": 5.555555555555556e-05,
94
- "loss": 0.0002,
95
  "step": 130
96
  },
97
  {
98
- "epoch": 15.56,
99
- "learning_rate": 4.4444444444444447e-05,
100
- "loss": 0.0002,
101
  "step": 140
102
  },
103
  {
104
- "epoch": 16.67,
105
- "learning_rate": 3.3333333333333335e-05,
106
- "loss": 0.0002,
107
  "step": 150
108
  },
109
  {
110
- "epoch": 17.78,
111
- "learning_rate": 2.2222222222222223e-05,
112
- "loss": 0.0002,
 
 
 
 
 
 
 
 
 
113
  "step": 160
114
  },
115
  {
116
- "epoch": 18.89,
117
- "learning_rate": 1.1111111111111112e-05,
118
- "loss": 0.0002,
119
  "step": 170
120
  },
121
  {
122
- "epoch": 20.0,
123
- "learning_rate": 0.0,
124
- "loss": 0.0002,
125
  "step": 180
126
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
127
  {
128
  "epoch": 20.0,
129
- "step": 180,
130
- "total_flos": 5.42468236068864e+16,
131
- "train_loss": 0.10162481290883281,
132
- "train_runtime": 67.7444,
133
- "train_samples_per_second": 10.333,
134
- "train_steps_per_second": 2.657
135
  }
136
  ],
137
- "max_steps": 180,
138
  "num_train_epochs": 20,
139
- "total_flos": 5.42468236068864e+16,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
 
1
  {
2
+ "best_metric": 0.7126299142837524,
3
+ "best_model_checkpoint": "./vit-base/checkpoint-200",
4
  "epoch": 20.0,
5
+ "global_step": 280,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.71,
12
+ "learning_rate": 0.00019357142857142858,
13
+ "loss": 2.073,
14
  "step": 10
15
  },
16
  {
17
+ "epoch": 1.43,
18
+ "learning_rate": 0.00018642857142857144,
19
+ "loss": 0.6674,
20
  "step": 20
21
  },
22
  {
23
+ "epoch": 2.14,
24
+ "learning_rate": 0.0001792857142857143,
25
+ "loss": 0.1817,
26
  "step": 30
27
  },
28
  {
29
+ "epoch": 2.86,
30
+ "learning_rate": 0.00017214285714285717,
31
+ "loss": 0.0578,
32
  "step": 40
33
  },
34
  {
35
+ "epoch": 3.57,
36
+ "learning_rate": 0.000165,
37
+ "loss": 0.0041,
38
  "step": 50
39
  },
40
  {
41
+ "epoch": 3.57,
42
+ "eval_accuracy": 0.7575757575757576,
43
+ "eval_loss": 0.5183216333389282,
44
+ "eval_runtime": 1.6943,
45
+ "eval_samples_per_second": 19.477,
46
+ "eval_steps_per_second": 2.951,
47
+ "step": 50
48
+ },
49
+ {
50
+ "epoch": 4.29,
51
+ "learning_rate": 0.00015785714285714285,
52
+ "loss": 0.007,
53
  "step": 60
54
  },
55
  {
56
+ "epoch": 5.0,
57
+ "learning_rate": 0.0001507142857142857,
58
+ "loss": 0.0018,
59
  "step": 70
60
  },
61
  {
62
+ "epoch": 5.71,
63
+ "learning_rate": 0.0001435714285714286,
64
+ "loss": 0.0009,
65
  "step": 80
66
  },
67
  {
68
+ "epoch": 6.43,
69
+ "learning_rate": 0.00013642857142857144,
70
+ "loss": 0.0007,
71
  "step": 90
72
  },
73
  {
74
+ "epoch": 7.14,
75
+ "learning_rate": 0.0001292857142857143,
76
+ "loss": 0.0006,
77
  "step": 100
78
  },
79
  {
80
+ "epoch": 7.14,
81
+ "eval_accuracy": 0.8181818181818182,
82
+ "eval_loss": 0.7554123401641846,
83
+ "eval_runtime": 1.4254,
84
+ "eval_samples_per_second": 23.151,
85
+ "eval_steps_per_second": 3.508,
86
  "step": 100
87
  },
88
  {
89
+ "epoch": 7.86,
90
+ "learning_rate": 0.00012214285714285715,
91
+ "loss": 0.0005,
92
  "step": 110
93
  },
94
  {
95
+ "epoch": 8.57,
96
+ "learning_rate": 0.00011499999999999999,
97
+ "loss": 0.0005,
98
  "step": 120
99
  },
100
  {
101
+ "epoch": 9.29,
102
+ "learning_rate": 0.00010785714285714286,
103
+ "loss": 0.0004,
104
  "step": 130
105
  },
106
  {
107
+ "epoch": 10.0,
108
+ "learning_rate": 0.00010071428571428571,
109
+ "loss": 0.0004,
110
  "step": 140
111
  },
112
  {
113
+ "epoch": 10.71,
114
+ "learning_rate": 9.357142857142858e-05,
115
+ "loss": 0.0004,
116
  "step": 150
117
  },
118
  {
119
+ "epoch": 10.71,
120
+ "eval_accuracy": 0.8181818181818182,
121
+ "eval_loss": 0.7197360396385193,
122
+ "eval_runtime": 1.4885,
123
+ "eval_samples_per_second": 22.17,
124
+ "eval_steps_per_second": 3.359,
125
+ "step": 150
126
+ },
127
+ {
128
+ "epoch": 11.43,
129
+ "learning_rate": 8.642857142857143e-05,
130
+ "loss": 0.0004,
131
  "step": 160
132
  },
133
  {
134
+ "epoch": 12.14,
135
+ "learning_rate": 7.928571428571429e-05,
136
+ "loss": 0.0003,
137
  "step": 170
138
  },
139
  {
140
+ "epoch": 12.86,
141
+ "learning_rate": 7.214285714285714e-05,
142
+ "loss": 0.0003,
143
  "step": 180
144
  },
145
+ {
146
+ "epoch": 13.57,
147
+ "learning_rate": 6.500000000000001e-05,
148
+ "loss": 0.0003,
149
+ "step": 190
150
+ },
151
+ {
152
+ "epoch": 14.29,
153
+ "learning_rate": 5.785714285714287e-05,
154
+ "loss": 0.0003,
155
+ "step": 200
156
+ },
157
+ {
158
+ "epoch": 14.29,
159
+ "eval_accuracy": 0.8181818181818182,
160
+ "eval_loss": 0.7126299142837524,
161
+ "eval_runtime": 1.5758,
162
+ "eval_samples_per_second": 20.942,
163
+ "eval_steps_per_second": 3.173,
164
+ "step": 200
165
+ },
166
+ {
167
+ "epoch": 15.0,
168
+ "learning_rate": 5.0714285714285716e-05,
169
+ "loss": 0.0003,
170
+ "step": 210
171
+ },
172
+ {
173
+ "epoch": 15.71,
174
+ "learning_rate": 4.3571428571428576e-05,
175
+ "loss": 0.0003,
176
+ "step": 220
177
+ },
178
+ {
179
+ "epoch": 16.43,
180
+ "learning_rate": 3.642857142857143e-05,
181
+ "loss": 0.0003,
182
+ "step": 230
183
+ },
184
+ {
185
+ "epoch": 17.14,
186
+ "learning_rate": 2.9285714285714288e-05,
187
+ "loss": 0.0003,
188
+ "step": 240
189
+ },
190
+ {
191
+ "epoch": 17.86,
192
+ "learning_rate": 2.214285714285714e-05,
193
+ "loss": 0.0003,
194
+ "step": 250
195
+ },
196
+ {
197
+ "epoch": 17.86,
198
+ "eval_accuracy": 0.8181818181818182,
199
+ "eval_loss": 0.7098276615142822,
200
+ "eval_runtime": 1.5439,
201
+ "eval_samples_per_second": 21.374,
202
+ "eval_steps_per_second": 3.239,
203
+ "step": 250
204
+ },
205
+ {
206
+ "epoch": 18.57,
207
+ "learning_rate": 1.5e-05,
208
+ "loss": 0.0003,
209
+ "step": 260
210
+ },
211
+ {
212
+ "epoch": 19.29,
213
+ "learning_rate": 7.857142857142858e-06,
214
+ "loss": 0.0003,
215
+ "step": 270
216
+ },
217
+ {
218
+ "epoch": 20.0,
219
+ "learning_rate": 7.142857142857143e-07,
220
+ "loss": 0.0003,
221
+ "step": 280
222
+ },
223
  {
224
  "epoch": 20.0,
225
+ "step": 280,
226
+ "total_flos": 8.5248064484352e+16,
227
+ "train_loss": 0.1071862239856273,
228
+ "train_runtime": 140.5527,
229
+ "train_samples_per_second": 7.826,
230
+ "train_steps_per_second": 1.992
231
  }
232
  ],
233
+ "max_steps": 280,
234
  "num_train_epochs": 20,
235
+ "total_flos": 8.5248064484352e+16,
236
  "trial_name": null,
237
  "trial_params": null
238
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5a7444871ccfb3c61a6a37bb117b483095c240103b17ea642d8889548d76bc4
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c49aa2c0a4b308580ecc8e9ea52b2bab03884419dd31d6c0fc3bf7ba3fc18f2b
3
  size 3963