pittawat commited on
Commit
41636df
1 Parent(s): 44bb136

🍻 cheers

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.38402849435806274,
5
- "eval_runtime": 1.7644,
6
- "eval_samples_per_second": 117.888,
7
- "eval_steps_per_second": 7.368,
8
- "total_flos": 3.22436019290112e+17,
9
- "train_loss": 0.9762612545129025,
10
- "train_runtime": 74.7912,
11
- "train_samples_per_second": 55.622,
12
- "train_steps_per_second": 1.765
13
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9572649572649573,
4
+ "eval_loss": 0.3159617781639099,
5
+ "eval_runtime": 1.9143,
6
+ "eval_samples_per_second": 122.237,
7
+ "eval_steps_per_second": 7.836,
8
+ "total_flos": 7.25481043402752e+17,
9
+ "train_loss": 0.6950366432602341,
10
+ "train_runtime": 183.7888,
11
+ "train_samples_per_second": 50.928,
12
+ "train_steps_per_second": 1.611
13
  }
runs/Jan12_00-14-49_7ecde4810381/events.out.tfevents.1705018829.7ecde4810381.24.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1abb09f82b29639033ec2d8840fe5f97bcc0dc901e6545208ddcab894e7d997
3
+ size 363
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.38402849435806274,
5
- "eval_runtime": 1.7644,
6
- "eval_samples_per_second": 117.888,
7
- "eval_steps_per_second": 7.368
8
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9572649572649573,
4
+ "eval_loss": 0.3159617781639099,
5
+ "eval_runtime": 1.9143,
6
+ "eval_samples_per_second": 122.237,
7
+ "eval_steps_per_second": 7.836
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
- "total_flos": 3.22436019290112e+17,
4
- "train_loss": 0.9762612545129025,
5
- "train_runtime": 74.7912,
6
- "train_samples_per_second": 55.622,
7
- "train_steps_per_second": 1.765
8
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "total_flos": 7.25481043402752e+17,
4
+ "train_loss": 0.6950366432602341,
5
+ "train_runtime": 183.7888,
6
+ "train_samples_per_second": 50.928,
7
+ "train_steps_per_second": 1.611
8
  }
trainer_state.json CHANGED
@@ -1,112 +1,217 @@
1
  {
2
- "best_metric": 0.38402849435806274,
3
- "best_model_checkpoint": "./vit-base-uppercase-english-characters/checkpoint-100",
4
  "epoch": 4.0,
5
- "global_step": 132,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.3,
12
- "learning_rate": 0.00018484848484848484,
13
- "loss": 3.0027,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 0.61,
18
- "learning_rate": 0.00016969696969696972,
19
- "loss": 2.2789,
20
  "step": 20
21
  },
22
  {
23
- "epoch": 0.91,
24
- "learning_rate": 0.00015454545454545454,
25
- "loss": 1.6762,
26
  "step": 30
27
  },
28
  {
29
- "epoch": 1.21,
30
- "learning_rate": 0.0001393939393939394,
31
- "loss": 1.2222,
32
  "step": 40
33
  },
34
  {
35
- "epoch": 1.52,
36
- "learning_rate": 0.00012424242424242425,
37
- "loss": 0.9241,
38
  "step": 50
39
  },
40
  {
41
- "epoch": 1.82,
42
- "learning_rate": 0.00010909090909090909,
43
- "loss": 0.7407,
44
  "step": 60
45
  },
46
  {
47
- "epoch": 2.12,
48
- "learning_rate": 9.393939393939395e-05,
49
- "loss": 0.5808,
50
  "step": 70
51
  },
52
  {
53
- "epoch": 2.42,
54
- "learning_rate": 7.878787878787879e-05,
55
- "loss": 0.4945,
56
  "step": 80
57
  },
58
  {
59
- "epoch": 2.73,
60
- "learning_rate": 6.363636363636364e-05,
61
- "loss": 0.4364,
62
  "step": 90
63
  },
64
  {
65
- "epoch": 3.03,
66
- "learning_rate": 4.848484848484849e-05,
67
- "loss": 0.3936,
68
  "step": 100
69
  },
70
  {
71
- "epoch": 3.03,
72
- "eval_accuracy": 1.0,
73
- "eval_loss": 0.38402849435806274,
74
- "eval_runtime": 1.6842,
75
- "eval_samples_per_second": 123.504,
76
- "eval_steps_per_second": 7.719,
77
  "step": 100
78
  },
79
  {
80
- "epoch": 3.33,
81
- "learning_rate": 3.3333333333333335e-05,
82
- "loss": 0.3722,
83
  "step": 110
84
  },
85
  {
86
- "epoch": 3.64,
87
- "learning_rate": 1.8181818181818182e-05,
88
- "loss": 0.3534,
89
  "step": 120
90
  },
91
  {
92
- "epoch": 3.94,
93
- "learning_rate": 3.0303030303030305e-06,
94
- "loss": 0.3421,
95
  "step": 130
96
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97
  {
98
  "epoch": 4.0,
99
- "step": 132,
100
- "total_flos": 3.22436019290112e+17,
101
- "train_loss": 0.9762612545129025,
102
- "train_runtime": 74.7912,
103
- "train_samples_per_second": 55.622,
104
- "train_steps_per_second": 1.765
105
  }
106
  ],
107
- "max_steps": 132,
108
  "num_train_epochs": 4,
109
- "total_flos": 3.22436019290112e+17,
110
  "trial_name": null,
111
  "trial_params": null
112
  }
 
1
  {
2
+ "best_metric": 0.3159617781639099,
3
+ "best_model_checkpoint": "./vit-base-uppercase-english-characters/checkpoint-200",
4
  "epoch": 4.0,
5
+ "global_step": 296,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.14,
12
+ "learning_rate": 0.00019324324324324326,
13
+ "loss": 3.1876,
14
  "step": 10
15
  },
16
  {
17
+ "epoch": 0.27,
18
+ "learning_rate": 0.0001864864864864865,
19
+ "loss": 2.7336,
20
  "step": 20
21
  },
22
  {
23
+ "epoch": 0.41,
24
+ "learning_rate": 0.00017972972972972974,
25
+ "loss": 2.2045,
26
  "step": 30
27
  },
28
  {
29
+ "epoch": 0.54,
30
+ "learning_rate": 0.000172972972972973,
31
+ "loss": 1.7453,
32
  "step": 40
33
  },
34
  {
35
+ "epoch": 0.68,
36
+ "learning_rate": 0.00016621621621621622,
37
+ "loss": 1.4371,
38
  "step": 50
39
  },
40
  {
41
+ "epoch": 0.81,
42
+ "learning_rate": 0.00015945945945945947,
43
+ "loss": 1.1114,
44
  "step": 60
45
  },
46
  {
47
+ "epoch": 0.95,
48
+ "learning_rate": 0.0001527027027027027,
49
+ "loss": 0.9965,
50
  "step": 70
51
  },
52
  {
53
+ "epoch": 1.08,
54
+ "learning_rate": 0.00014594594594594595,
55
+ "loss": 0.7593,
56
  "step": 80
57
  },
58
  {
59
+ "epoch": 1.22,
60
+ "learning_rate": 0.0001391891891891892,
61
+ "loss": 0.6622,
62
  "step": 90
63
  },
64
  {
65
+ "epoch": 1.35,
66
+ "learning_rate": 0.00013243243243243243,
67
+ "loss": 0.5944,
68
  "step": 100
69
  },
70
  {
71
+ "epoch": 1.35,
72
+ "eval_accuracy": 0.9487179487179487,
73
+ "eval_loss": 0.5538277626037598,
74
+ "eval_runtime": 1.9221,
75
+ "eval_samples_per_second": 121.742,
76
+ "eval_steps_per_second": 7.804,
77
  "step": 100
78
  },
79
  {
80
+ "epoch": 1.49,
81
+ "learning_rate": 0.00012567567567567568,
82
+ "loss": 0.4882,
83
  "step": 110
84
  },
85
  {
86
+ "epoch": 1.62,
87
+ "learning_rate": 0.00011891891891891893,
88
+ "loss": 0.46,
89
  "step": 120
90
  },
91
  {
92
+ "epoch": 1.76,
93
+ "learning_rate": 0.00011216216216216217,
94
+ "loss": 0.4453,
95
  "step": 130
96
  },
97
+ {
98
+ "epoch": 1.89,
99
+ "learning_rate": 0.0001054054054054054,
100
+ "loss": 0.4454,
101
+ "step": 140
102
+ },
103
+ {
104
+ "epoch": 2.03,
105
+ "learning_rate": 9.864864864864865e-05,
106
+ "loss": 0.3618,
107
+ "step": 150
108
+ },
109
+ {
110
+ "epoch": 2.16,
111
+ "learning_rate": 9.18918918918919e-05,
112
+ "loss": 0.3138,
113
+ "step": 160
114
+ },
115
+ {
116
+ "epoch": 2.3,
117
+ "learning_rate": 8.513513513513514e-05,
118
+ "loss": 0.2605,
119
+ "step": 170
120
+ },
121
+ {
122
+ "epoch": 2.43,
123
+ "learning_rate": 7.837837837837838e-05,
124
+ "loss": 0.292,
125
+ "step": 180
126
+ },
127
+ {
128
+ "epoch": 2.57,
129
+ "learning_rate": 7.162162162162162e-05,
130
+ "loss": 0.2502,
131
+ "step": 190
132
+ },
133
+ {
134
+ "epoch": 2.7,
135
+ "learning_rate": 6.486486486486487e-05,
136
+ "loss": 0.2241,
137
+ "step": 200
138
+ },
139
+ {
140
+ "epoch": 2.7,
141
+ "eval_accuracy": 0.9572649572649573,
142
+ "eval_loss": 0.3159617781639099,
143
+ "eval_runtime": 1.8767,
144
+ "eval_samples_per_second": 124.688,
145
+ "eval_steps_per_second": 7.993,
146
+ "step": 200
147
+ },
148
+ {
149
+ "epoch": 2.84,
150
+ "learning_rate": 5.8108108108108105e-05,
151
+ "loss": 0.2273,
152
+ "step": 210
153
+ },
154
+ {
155
+ "epoch": 2.97,
156
+ "learning_rate": 5.135135135135135e-05,
157
+ "loss": 0.2002,
158
+ "step": 220
159
+ },
160
+ {
161
+ "epoch": 3.11,
162
+ "learning_rate": 4.4594594594594596e-05,
163
+ "loss": 0.163,
164
+ "step": 230
165
+ },
166
+ {
167
+ "epoch": 3.24,
168
+ "learning_rate": 3.783783783783784e-05,
169
+ "loss": 0.1654,
170
+ "step": 240
171
+ },
172
+ {
173
+ "epoch": 3.38,
174
+ "learning_rate": 3.108108108108108e-05,
175
+ "loss": 0.1569,
176
+ "step": 250
177
+ },
178
+ {
179
+ "epoch": 3.51,
180
+ "learning_rate": 2.4324324324324327e-05,
181
+ "loss": 0.1507,
182
+ "step": 260
183
+ },
184
+ {
185
+ "epoch": 3.65,
186
+ "learning_rate": 1.756756756756757e-05,
187
+ "loss": 0.1543,
188
+ "step": 270
189
+ },
190
+ {
191
+ "epoch": 3.78,
192
+ "learning_rate": 1.0810810810810812e-05,
193
+ "loss": 0.158,
194
+ "step": 280
195
+ },
196
+ {
197
+ "epoch": 3.92,
198
+ "learning_rate": 4.0540540540540545e-06,
199
+ "loss": 0.14,
200
+ "step": 290
201
+ },
202
  {
203
  "epoch": 4.0,
204
+ "step": 296,
205
+ "total_flos": 7.25481043402752e+17,
206
+ "train_loss": 0.6950366432602341,
207
+ "train_runtime": 183.7888,
208
+ "train_samples_per_second": 50.928,
209
+ "train_steps_per_second": 1.611
210
  }
211
  ],
212
+ "max_steps": 296,
213
  "num_train_epochs": 4,
214
+ "total_flos": 7.25481043402752e+17,
215
  "trial_name": null,
216
  "trial_params": null
217
  }