dima806 commited on
Commit
0f02543
·
verified ·
1 Parent(s): 2c4b167

Upload folder using huggingface_hub

Browse files
checkpoint-12118/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3eaf20bd8c8686fab8a7fa784e48aa41c53e155e7279516f67a0d499a1633c7c
3
  size 345986248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c063212b1c0b2921499024070d1203cccf9d81b7771aae6406b22d9af98ad45
3
  size 345986248
checkpoint-12118/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63605b7da669cdedc830ee8c17f3d7b4f013f3e433dd1529d44525495945ab24
3
  size 692092933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d923cbe6b2dae4eddb56d43ebc40cc49f7b0213ccf17f3b45f77935a5757fe40
3
  size 692092933
checkpoint-12118/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 6.000739574432373,
3
  "best_model_checkpoint": "flowers_image_detection/checkpoint-12118",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,188 +10,188 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0825218682950982,
13
- "grad_norm": 1.7390600442886353,
14
  "learning_rate": 1.9254226052369905e-07,
15
- "loss": 5.9885,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.1650437365901964,
20
- "grad_norm": 1.7211048603057861,
21
  "learning_rate": 1.842558833278091e-07,
22
- "loss": 5.9808,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.2475656048852946,
27
- "grad_norm": 1.73354172706604,
28
  "learning_rate": 1.7596950613191912e-07,
29
- "loss": 5.9877,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.3300874731803928,
34
- "grad_norm": 1.7605706453323364,
35
  "learning_rate": 1.6768312893602916e-07,
36
- "loss": 5.9764,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.412609341475491,
41
- "grad_norm": 2.0977978706359863,
42
  "learning_rate": 1.593967517401392e-07,
43
- "loss": 5.9758,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.4951312097705892,
48
- "grad_norm": 1.792007327079773,
49
  "learning_rate": 1.5111037454424923e-07,
50
- "loss": 5.9702,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.5776530780656874,
55
- "grad_norm": 1.7574431896209717,
56
  "learning_rate": 1.428239973483593e-07,
57
- "loss": 5.9639,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.6601749463607856,
62
- "grad_norm": 1.81585693359375,
63
  "learning_rate": 1.3453762015246935e-07,
64
- "loss": 5.9654,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.7426968146558838,
69
- "grad_norm": 1.852972388267517,
70
  "learning_rate": 1.262512429565794e-07,
71
- "loss": 5.9572,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.825218682950982,
76
- "grad_norm": 1.796462893486023,
77
  "learning_rate": 1.1796486576068942e-07,
78
- "loss": 5.9637,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.9077405512460802,
83
- "grad_norm": 1.8212686777114868,
84
  "learning_rate": 1.0967848856479946e-07,
85
- "loss": 5.9616,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.9902624195411784,
90
- "grad_norm": 1.8188484907150269,
91
  "learning_rate": 1.0139211136890951e-07,
92
- "loss": 5.9579,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 1.0,
97
- "eval_accuracy": 0.6417130919220055,
98
- "eval_loss": 6.009731292724609,
99
- "eval_runtime": 1266.1072,
100
- "eval_samples_per_second": 102.077,
101
- "eval_steps_per_second": 12.76,
102
  "step": 6059
103
  },
104
  {
105
  "epoch": 1.0727842878362766,
106
- "grad_norm": 1.8866934776306152,
107
  "learning_rate": 9.310573417301956e-08,
108
- "loss": 5.9542,
109
  "step": 6500
110
  },
111
  {
112
  "epoch": 1.1553061561313749,
113
- "grad_norm": 1.9183136224746704,
114
  "learning_rate": 8.481935697712959e-08,
115
- "loss": 5.9581,
116
  "step": 7000
117
  },
118
  {
119
  "epoch": 1.237828024426473,
120
- "grad_norm": 1.7592434883117676,
121
  "learning_rate": 7.653297978123964e-08,
122
- "loss": 5.9566,
123
  "step": 7500
124
  },
125
  {
126
  "epoch": 1.320349892721571,
127
- "grad_norm": 1.981501817703247,
128
  "learning_rate": 6.824660258534968e-08,
129
- "loss": 5.9557,
130
  "step": 8000
131
  },
132
  {
133
  "epoch": 1.4028717610166694,
134
- "grad_norm": 1.7875568866729736,
135
  "learning_rate": 5.996022538945973e-08,
136
- "loss": 5.9481,
137
  "step": 8500
138
  },
139
  {
140
  "epoch": 1.4853936293117675,
141
- "grad_norm": 1.689201831817627,
142
  "learning_rate": 5.167384819356977e-08,
143
- "loss": 5.9487,
144
  "step": 9000
145
  },
146
  {
147
  "epoch": 1.5679154976068657,
148
- "grad_norm": 1.760799765586853,
149
  "learning_rate": 4.3387470997679816e-08,
150
- "loss": 5.9511,
151
  "step": 9500
152
  },
153
  {
154
  "epoch": 1.650437365901964,
155
- "grad_norm": 1.7961113452911377,
156
  "learning_rate": 3.510109380178986e-08,
157
- "loss": 5.948,
158
  "step": 10000
159
  },
160
  {
161
  "epoch": 1.7329592341970623,
162
- "grad_norm": 1.9323595762252808,
163
  "learning_rate": 2.68147166058999e-08,
164
- "loss": 5.9534,
165
  "step": 10500
166
  },
167
  {
168
  "epoch": 1.8154811024921604,
169
- "grad_norm": 1.7695621252059937,
170
  "learning_rate": 1.8528339410009945e-08,
171
- "loss": 5.9465,
172
  "step": 11000
173
  },
174
  {
175
  "epoch": 1.8980029707872585,
176
- "grad_norm": 1.840099573135376,
177
  "learning_rate": 1.0241962214119987e-08,
178
- "loss": 5.9464,
179
  "step": 11500
180
  },
181
  {
182
  "epoch": 1.9805248390823569,
183
- "grad_norm": 1.7224979400634766,
184
  "learning_rate": 1.95558501823003e-09,
185
- "loss": 5.9453,
186
  "step": 12000
187
  },
188
  {
189
  "epoch": 2.0,
190
- "eval_accuracy": 0.6448545341999381,
191
- "eval_loss": 6.000739574432373,
192
- "eval_runtime": 1247.3729,
193
- "eval_samples_per_second": 103.61,
194
- "eval_steps_per_second": 12.951,
195
  "step": 12118
196
  }
197
  ],
 
1
  {
2
+ "best_metric": 5.964588165283203,
3
  "best_model_checkpoint": "flowers_image_detection/checkpoint-12118",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0825218682950982,
13
+ "grad_norm": 1.8450349569320679,
14
  "learning_rate": 1.9254226052369905e-07,
15
+ "loss": 5.9475,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.1650437365901964,
20
+ "grad_norm": 1.7727391719818115,
21
  "learning_rate": 1.842558833278091e-07,
22
+ "loss": 5.948,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.2475656048852946,
27
+ "grad_norm": 1.7900820970535278,
28
  "learning_rate": 1.7596950613191912e-07,
29
+ "loss": 5.9467,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.3300874731803928,
34
+ "grad_norm": 1.6870242357254028,
35
  "learning_rate": 1.6768312893602916e-07,
36
+ "loss": 5.935,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.412609341475491,
41
+ "grad_norm": 1.9448150396347046,
42
  "learning_rate": 1.593967517401392e-07,
43
+ "loss": 5.9367,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.4951312097705892,
48
+ "grad_norm": 1.7643060684204102,
49
  "learning_rate": 1.5111037454424923e-07,
50
+ "loss": 5.9283,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.5776530780656874,
55
+ "grad_norm": 1.7454640865325928,
56
  "learning_rate": 1.428239973483593e-07,
57
+ "loss": 5.9315,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.6601749463607856,
62
+ "grad_norm": 1.7440547943115234,
63
  "learning_rate": 1.3453762015246935e-07,
64
+ "loss": 5.9237,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.7426968146558838,
69
+ "grad_norm": 1.7682538032531738,
70
  "learning_rate": 1.262512429565794e-07,
71
+ "loss": 5.9265,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.825218682950982,
76
+ "grad_norm": 1.7519503831863403,
77
  "learning_rate": 1.1796486576068942e-07,
78
+ "loss": 5.9222,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.9077405512460802,
83
+ "grad_norm": 1.7960128784179688,
84
  "learning_rate": 1.0967848856479946e-07,
85
+ "loss": 5.9195,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.9902624195411784,
90
+ "grad_norm": 1.9735090732574463,
91
  "learning_rate": 1.0139211136890951e-07,
92
+ "loss": 5.9239,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 1.0,
97
+ "eval_accuracy": 0.6516635716496441,
98
+ "eval_loss": 5.973537445068359,
99
+ "eval_runtime": 1279.8379,
100
+ "eval_samples_per_second": 100.982,
101
+ "eval_steps_per_second": 12.623,
102
  "step": 6059
103
  },
104
  {
105
  "epoch": 1.0727842878362766,
106
+ "grad_norm": 1.7479947805404663,
107
  "learning_rate": 9.310573417301956e-08,
108
+ "loss": 5.9212,
109
  "step": 6500
110
  },
111
  {
112
  "epoch": 1.1553061561313749,
113
+ "grad_norm": 1.8694578409194946,
114
  "learning_rate": 8.481935697712959e-08,
115
+ "loss": 5.9106,
116
  "step": 7000
117
  },
118
  {
119
  "epoch": 1.237828024426473,
120
+ "grad_norm": 1.7446856498718262,
121
  "learning_rate": 7.653297978123964e-08,
122
+ "loss": 5.919,
123
  "step": 7500
124
  },
125
  {
126
  "epoch": 1.320349892721571,
127
+ "grad_norm": 1.7331393957138062,
128
  "learning_rate": 6.824660258534968e-08,
129
+ "loss": 5.9144,
130
  "step": 8000
131
  },
132
  {
133
  "epoch": 1.4028717610166694,
134
+ "grad_norm": 1.664704442024231,
135
  "learning_rate": 5.996022538945973e-08,
136
+ "loss": 5.9162,
137
  "step": 8500
138
  },
139
  {
140
  "epoch": 1.4853936293117675,
141
+ "grad_norm": 1.6834096908569336,
142
  "learning_rate": 5.167384819356977e-08,
143
+ "loss": 5.9135,
144
  "step": 9000
145
  },
146
  {
147
  "epoch": 1.5679154976068657,
148
+ "grad_norm": 1.8518224954605103,
149
  "learning_rate": 4.3387470997679816e-08,
150
+ "loss": 5.9141,
151
  "step": 9500
152
  },
153
  {
154
  "epoch": 1.650437365901964,
155
+ "grad_norm": 1.7295408248901367,
156
  "learning_rate": 3.510109380178986e-08,
157
+ "loss": 5.9103,
158
  "step": 10000
159
  },
160
  {
161
  "epoch": 1.7329592341970623,
162
+ "grad_norm": 1.839285135269165,
163
  "learning_rate": 2.68147166058999e-08,
164
+ "loss": 5.9081,
165
  "step": 10500
166
  },
167
  {
168
  "epoch": 1.8154811024921604,
169
+ "grad_norm": 1.8111240863800049,
170
  "learning_rate": 1.8528339410009945e-08,
171
+ "loss": 5.9104,
172
  "step": 11000
173
  },
174
  {
175
  "epoch": 1.8980029707872585,
176
+ "grad_norm": 1.763000249862671,
177
  "learning_rate": 1.0241962214119987e-08,
178
+ "loss": 5.91,
179
  "step": 11500
180
  },
181
  {
182
  "epoch": 1.9805248390823569,
183
+ "grad_norm": 1.8061938285827637,
184
  "learning_rate": 1.95558501823003e-09,
185
+ "loss": 5.9083,
186
  "step": 12000
187
  },
188
  {
189
  "epoch": 2.0,
190
+ "eval_accuracy": 0.6545032497678738,
191
+ "eval_loss": 5.964588165283203,
192
+ "eval_runtime": 1245.0154,
193
+ "eval_samples_per_second": 103.806,
194
+ "eval_steps_per_second": 12.976,
195
  "step": 12118
196
  }
197
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3eaf20bd8c8686fab8a7fa784e48aa41c53e155e7279516f67a0d499a1633c7c
3
  size 345986248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c063212b1c0b2921499024070d1203cccf9d81b7771aae6406b22d9af98ad45
3
  size 345986248