Upload folder using huggingface_hub

#2
by Mirkat - opened
Files changed (6) hide show
  1. optimizer.pt +2 -2
  2. pytorch_model.bin +1 -1
  3. rng_state.pth +1 -1
  4. scheduler.pt +1 -1
  5. trainer_state.json +78 -177
  6. training_args.bin +1 -1
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3872c3bca0bcaada8b7c91afab197a88f39c328e8aaded23ce282e996b32aac0
3
- size 686587077
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e24c2340e30017c7624660104e3a0fb850bbd378a2f7509d3004b44a447ce4f3
3
+ size 686586885
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64b6d2b1634d4e5818b3b03ba56b6ff5ea6a172e5705aad392ee633558360106
3
  size 343302829
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6c092d7c5b9f453b9c06ae90b5869ac471bb7a110aee92da14819d546852281
3
  size 343302829
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:132429c3ef48097d659f3fa34f0ca82d09f907b2d0b58363bcfefa9ddb19fe7f
3
  size 13553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8214c01f27f2aeae1e56fc7a28278e26d2d258088ec2bdf3bdc701698ad3524
3
  size 13553
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ed8a156a22c309bb91c33d910110b63f1c190e1e24dadfe22b621d95df2fa8a
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e9d1478932d95f604c248a1fe1362a1d07bf90d5ca17e1579a67752b11f2fc2
3
  size 627
trainer_state.json CHANGED
@@ -1,247 +1,148 @@
1
  {
2
- "best_metric": 0.43153366446495056,
3
- "best_model_checkpoint": "./plant-classification/checkpoint-280",
4
- "epoch": 3.5,
5
- "global_step": 280,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.12,
12
- "learning_rate": 0.00019375000000000002,
13
- "loss": 2.4618,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 0.25,
18
- "learning_rate": 0.0001875,
19
- "loss": 2.0277,
20
  "step": 20
21
  },
22
  {
23
- "epoch": 0.38,
24
- "learning_rate": 0.00018125000000000001,
25
- "loss": 1.6392,
26
  "step": 30
27
  },
28
  {
29
- "epoch": 0.5,
30
- "learning_rate": 0.000175,
31
- "loss": 1.3747,
32
  "step": 40
33
  },
34
  {
35
- "epoch": 0.5,
36
- "eval_accuracy": 0.7626168224299066,
37
- "eval_loss": 1.1831709146499634,
38
- "eval_runtime": 384.9557,
39
- "eval_samples_per_second": 1.39,
40
- "eval_steps_per_second": 0.174,
41
  "step": 40
42
  },
43
  {
44
- "epoch": 0.62,
45
- "learning_rate": 0.00016875,
46
- "loss": 1.2425,
47
  "step": 50
48
  },
49
  {
50
- "epoch": 0.75,
51
- "learning_rate": 0.00016250000000000002,
52
- "loss": 1.1063,
53
  "step": 60
54
  },
55
  {
56
- "epoch": 0.88,
57
- "learning_rate": 0.00015625,
58
- "loss": 0.9224,
59
  "step": 70
60
  },
61
  {
62
- "epoch": 1.0,
63
- "learning_rate": 0.00015000000000000001,
64
- "loss": 0.7905,
65
  "step": 80
66
  },
67
  {
68
- "epoch": 1.0,
69
- "eval_accuracy": 0.8130841121495327,
70
- "eval_loss": 0.7577788233757019,
71
- "eval_runtime": 381.7049,
72
- "eval_samples_per_second": 1.402,
73
- "eval_steps_per_second": 0.176,
74
  "step": 80
75
  },
76
  {
77
- "epoch": 1.12,
78
- "learning_rate": 0.00014375,
79
- "loss": 0.6613,
80
  "step": 90
81
  },
82
  {
83
- "epoch": 1.25,
84
- "learning_rate": 0.0001375,
85
- "loss": 0.6946,
86
  "step": 100
87
  },
88
  {
89
- "epoch": 1.38,
90
- "learning_rate": 0.00013125000000000002,
91
- "loss": 0.5187,
92
  "step": 110
93
  },
94
  {
95
- "epoch": 1.5,
96
- "learning_rate": 0.000125,
97
- "loss": 0.5223,
98
  "step": 120
99
  },
100
  {
101
- "epoch": 1.5,
102
- "eval_accuracy": 0.8186915887850468,
103
- "eval_loss": 0.6094576120376587,
104
- "eval_runtime": 389.3932,
105
- "eval_samples_per_second": 1.374,
106
- "eval_steps_per_second": 0.172,
107
  "step": 120
108
  },
109
  {
110
- "epoch": 1.62,
111
- "learning_rate": 0.00011875,
112
- "loss": 0.5048,
113
  "step": 130
114
  },
115
  {
116
- "epoch": 1.75,
117
- "learning_rate": 0.00011250000000000001,
118
- "loss": 0.5559,
119
  "step": 140
120
  },
121
  {
122
- "epoch": 1.88,
123
- "learning_rate": 0.00010625000000000001,
124
- "loss": 0.4757,
125
  "step": 150
126
  },
127
  {
128
- "epoch": 2.0,
129
- "learning_rate": 0.0001,
130
- "loss": 0.3683,
131
  "step": 160
132
  },
133
  {
134
- "epoch": 2.0,
135
- "eval_accuracy": 0.8542056074766355,
136
- "eval_loss": 0.5075709819793701,
137
- "eval_runtime": 384.1646,
138
- "eval_samples_per_second": 1.393,
139
- "eval_steps_per_second": 0.174,
140
  "step": 160
141
- },
142
- {
143
- "epoch": 2.12,
144
- "learning_rate": 9.375e-05,
145
- "loss": 0.3126,
146
- "step": 170
147
- },
148
- {
149
- "epoch": 2.25,
150
- "learning_rate": 8.75e-05,
151
- "loss": 0.3093,
152
- "step": 180
153
- },
154
- {
155
- "epoch": 2.38,
156
- "learning_rate": 8.125000000000001e-05,
157
- "loss": 0.3063,
158
- "step": 190
159
- },
160
- {
161
- "epoch": 2.5,
162
- "learning_rate": 7.500000000000001e-05,
163
- "loss": 0.2401,
164
- "step": 200
165
- },
166
- {
167
- "epoch": 2.5,
168
- "eval_accuracy": 0.8467289719626169,
169
- "eval_loss": 0.4515593349933624,
170
- "eval_runtime": 374.8793,
171
- "eval_samples_per_second": 1.427,
172
- "eval_steps_per_second": 0.179,
173
- "step": 200
174
- },
175
- {
176
- "epoch": 2.62,
177
- "learning_rate": 6.875e-05,
178
- "loss": 0.3209,
179
- "step": 210
180
- },
181
- {
182
- "epoch": 2.75,
183
- "learning_rate": 6.25e-05,
184
- "loss": 0.2538,
185
- "step": 220
186
- },
187
- {
188
- "epoch": 2.88,
189
- "learning_rate": 5.6250000000000005e-05,
190
- "loss": 0.2671,
191
- "step": 230
192
- },
193
- {
194
- "epoch": 3.0,
195
- "learning_rate": 5e-05,
196
- "loss": 0.2688,
197
- "step": 240
198
- },
199
- {
200
- "epoch": 3.0,
201
- "eval_accuracy": 0.8598130841121495,
202
- "eval_loss": 0.4518713057041168,
203
- "eval_runtime": 371.598,
204
- "eval_samples_per_second": 1.44,
205
- "eval_steps_per_second": 0.18,
206
- "step": 240
207
- },
208
- {
209
- "epoch": 3.12,
210
- "learning_rate": 4.375e-05,
211
- "loss": 0.1702,
212
- "step": 250
213
- },
214
- {
215
- "epoch": 3.25,
216
- "learning_rate": 3.7500000000000003e-05,
217
- "loss": 0.1993,
218
- "step": 260
219
- },
220
- {
221
- "epoch": 3.38,
222
- "learning_rate": 3.125e-05,
223
- "loss": 0.218,
224
- "step": 270
225
- },
226
- {
227
- "epoch": 3.5,
228
- "learning_rate": 2.5e-05,
229
- "loss": 0.1583,
230
- "step": 280
231
- },
232
- {
233
- "epoch": 3.5,
234
- "eval_accuracy": 0.874766355140187,
235
- "eval_loss": 0.43153366446495056,
236
- "eval_runtime": 380.0584,
237
- "eval_samples_per_second": 1.408,
238
- "eval_steps_per_second": 0.176,
239
- "step": 280
240
  }
241
  ],
242
- "max_steps": 320,
243
- "num_train_epochs": 4,
244
- "total_flos": 3.467364497947607e+17,
245
  "trial_name": null,
246
  "trial_params": null
247
  }
 
1
  {
2
+ "best_metric": 0.5926051735877991,
3
+ "best_model_checkpoint": "./plant-classification/checkpoint-160",
4
+ "epoch": 1.951219512195122,
5
+ "global_step": 160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.12,
12
+ "learning_rate": 0.0001878048780487805,
13
+ "loss": 2.4403,
14
  "step": 10
15
  },
16
  {
17
+ "epoch": 0.24,
18
+ "learning_rate": 0.000175609756097561,
19
+ "loss": 1.9498,
20
  "step": 20
21
  },
22
  {
23
+ "epoch": 0.37,
24
+ "learning_rate": 0.00016341463414634147,
25
+ "loss": 1.5422,
26
  "step": 30
27
  },
28
  {
29
+ "epoch": 0.49,
30
+ "learning_rate": 0.00015121951219512197,
31
+ "loss": 1.2802,
32
  "step": 40
33
  },
34
  {
35
+ "epoch": 0.49,
36
+ "eval_accuracy": 0.7532467532467533,
37
+ "eval_loss": 1.1777054071426392,
38
+ "eval_runtime": 245.0854,
39
+ "eval_samples_per_second": 2.199,
40
+ "eval_steps_per_second": 0.277,
41
  "step": 40
42
  },
43
  {
44
+ "epoch": 0.61,
45
+ "learning_rate": 0.00013902439024390245,
46
+ "loss": 1.1818,
47
  "step": 50
48
  },
49
  {
50
+ "epoch": 0.73,
51
+ "learning_rate": 0.00012682926829268293,
52
+ "loss": 1.0576,
53
  "step": 60
54
  },
55
  {
56
+ "epoch": 0.85,
57
+ "learning_rate": 0.00011463414634146342,
58
+ "loss": 0.9448,
59
  "step": 70
60
  },
61
  {
62
+ "epoch": 0.98,
63
+ "learning_rate": 0.0001024390243902439,
64
+ "loss": 0.9498,
65
  "step": 80
66
  },
67
  {
68
+ "epoch": 0.98,
69
+ "eval_accuracy": 0.8311688311688312,
70
+ "eval_loss": 0.820961058139801,
71
+ "eval_runtime": 244.7769,
72
+ "eval_samples_per_second": 2.202,
73
+ "eval_steps_per_second": 0.278,
74
  "step": 80
75
  },
76
  {
77
+ "epoch": 1.1,
78
+ "learning_rate": 9.02439024390244e-05,
79
+ "loss": 0.6939,
80
  "step": 90
81
  },
82
  {
83
+ "epoch": 1.22,
84
+ "learning_rate": 7.804878048780489e-05,
85
+ "loss": 0.6009,
86
  "step": 100
87
  },
88
  {
89
+ "epoch": 1.34,
90
+ "learning_rate": 6.585365853658538e-05,
91
+ "loss": 0.593,
92
  "step": 110
93
  },
94
  {
95
+ "epoch": 1.46,
96
+ "learning_rate": 5.365853658536586e-05,
97
+ "loss": 0.5132,
98
  "step": 120
99
  },
100
  {
101
+ "epoch": 1.46,
102
+ "eval_accuracy": 0.8330241187384044,
103
+ "eval_loss": 0.6491296887397766,
104
+ "eval_runtime": 247.5801,
105
+ "eval_samples_per_second": 2.177,
106
+ "eval_steps_per_second": 0.275,
107
  "step": 120
108
  },
109
  {
110
+ "epoch": 1.59,
111
+ "learning_rate": 4.146341463414634e-05,
112
+ "loss": 0.5321,
113
  "step": 130
114
  },
115
  {
116
+ "epoch": 1.71,
117
+ "learning_rate": 2.926829268292683e-05,
118
+ "loss": 0.4869,
119
  "step": 140
120
  },
121
  {
122
+ "epoch": 1.83,
123
+ "learning_rate": 1.707317073170732e-05,
124
+ "loss": 0.4651,
125
  "step": 150
126
  },
127
  {
128
+ "epoch": 1.95,
129
+ "learning_rate": 4.8780487804878055e-06,
130
+ "loss": 0.5354,
131
  "step": 160
132
  },
133
  {
134
+ "epoch": 1.95,
135
+ "eval_accuracy": 0.8571428571428571,
136
+ "eval_loss": 0.5926051735877991,
137
+ "eval_runtime": 248.1335,
138
+ "eval_samples_per_second": 2.172,
139
+ "eval_steps_per_second": 0.274,
140
  "step": 160
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
141
  }
142
  ],
143
+ "max_steps": 164,
144
+ "num_train_epochs": 2,
145
+ "total_flos": 1.9809082826897818e+17,
146
  "trial_name": null,
147
  "trial_params": null
148
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaa90b2bf99e43bd879b69acbb4d88ab9a0137685671e23de8df26be9573fb3d
3
  size 3899
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b235ff0483f9bbab0da85fe4a9ed55d0e6e523372e5e8e176c86ff866cd91f31
3
  size 3899