dima806 commited on
Commit
bb19cb7
1 Parent(s): d563703

Upload folder using huggingface_hub

Browse files
checkpoint-10945/config.json CHANGED
@@ -224,5 +224,5 @@
224
  "problem_type": "single_label_classification",
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
- "transformers_version": "4.39.2"
228
  }
 
224
  "problem_type": "single_label_classification",
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
+ "transformers_version": "4.39.3"
228
  }
checkpoint-10945/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccf47aecf2a5fe3fd2c3f2724fbbfb6295e0d057bb189850fbdf7f05b8d977d3
3
  size 343525432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6df9d6bd9f12074fbbeba04adf05e42f2d5b750360625482975e711cacae747a
3
  size 343525432
checkpoint-10945/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f34f9061525e3d68314e07eba8fc9c7c851ebcc9f5ec6a69ea45435c3e3c6c7a
3
  size 687171333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8379a7676830aca29c3492b682fdeebb23b3720e5d1b01a041d42a67c5b9d2a
3
  size 687171333
checkpoint-10945/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.6230026483535767,
3
  "best_model_checkpoint": "mushrooms_image_detection/checkpoint-10945",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,158 +10,158 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.05,
13
- "grad_norm": 5.758909702301025,
14
  "learning_rate": 1.9173932996787516e-07,
15
- "loss": 0.7238,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09,
20
- "grad_norm": 7.06810188293457,
21
  "learning_rate": 1.825608077099587e-07,
22
- "loss": 0.7267,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14,
27
- "grad_norm": 6.429927349090576,
28
  "learning_rate": 1.733822854520422e-07,
29
- "loss": 0.711,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.18,
34
- "grad_norm": 7.55098819732666,
35
  "learning_rate": 1.6420376319412576e-07,
36
- "loss": 0.7174,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.23,
41
- "grad_norm": 7.272024154663086,
42
  "learning_rate": 1.5502524093620926e-07,
43
- "loss": 0.713,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.27,
48
- "grad_norm": 8.493428230285645,
49
  "learning_rate": 1.458467186782928e-07,
50
- "loss": 0.6996,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.32,
55
- "grad_norm": 4.434696197509766,
56
  "learning_rate": 1.366681964203763e-07,
57
- "loss": 0.7165,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.37,
62
- "grad_norm": 6.052495956420898,
63
  "learning_rate": 1.2748967416245983e-07,
64
- "loss": 0.7169,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.41,
69
- "grad_norm": 10.02051067352295,
70
  "learning_rate": 1.1831115190454337e-07,
71
- "loss": 0.6994,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.46,
76
- "grad_norm": 4.502712726593018,
77
  "learning_rate": 1.0913262964662688e-07,
78
- "loss": 0.7075,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.5,
83
- "grad_norm": 4.787944793701172,
84
  "learning_rate": 9.995410738871042e-08,
85
- "loss": 0.7136,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.55,
90
- "grad_norm": 8.738495826721191,
91
  "learning_rate": 9.077558513079394e-08,
92
- "loss": 0.6976,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 0.59,
97
- "grad_norm": 6.709692001342773,
98
  "learning_rate": 8.159706287287747e-08,
99
- "loss": 0.6994,
100
  "step": 6500
101
  },
102
  {
103
  "epoch": 0.64,
104
- "grad_norm": 2.5347442626953125,
105
  "learning_rate": 7.241854061496099e-08,
106
- "loss": 0.6996,
107
  "step": 7000
108
  },
109
  {
110
  "epoch": 0.69,
111
- "grad_norm": 5.286170482635498,
112
  "learning_rate": 6.32400183570445e-08,
113
- "loss": 0.6961,
114
  "step": 7500
115
  },
116
  {
117
  "epoch": 0.73,
118
- "grad_norm": 5.30819034576416,
119
  "learning_rate": 5.406149609912804e-08,
120
- "loss": 0.6897,
121
  "step": 8000
122
  },
123
  {
124
  "epoch": 0.78,
125
- "grad_norm": 7.743193626403809,
126
  "learning_rate": 4.488297384121156e-08,
127
- "loss": 0.6855,
128
  "step": 8500
129
  },
130
  {
131
  "epoch": 0.82,
132
- "grad_norm": 8.52515697479248,
133
  "learning_rate": 3.5704451583295086e-08,
134
- "loss": 0.6966,
135
  "step": 9000
136
  },
137
  {
138
  "epoch": 0.87,
139
- "grad_norm": 5.206400394439697,
140
  "learning_rate": 2.6525929325378617e-08,
141
- "loss": 0.7043,
142
  "step": 9500
143
  },
144
  {
145
  "epoch": 0.91,
146
- "grad_norm": 6.084430694580078,
147
  "learning_rate": 1.7347407067462138e-08,
148
- "loss": 0.6943,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 0.96,
153
- "grad_norm": 8.045140266418457,
154
  "learning_rate": 8.168884809545663e-09,
155
- "loss": 0.6869,
156
  "step": 10500
157
  },
158
  {
159
  "epoch": 1.0,
160
- "eval_accuracy": 0.8854163097481583,
161
- "eval_loss": 0.6230026483535767,
162
- "eval_runtime": 2891.1403,
163
- "eval_samples_per_second": 80.757,
164
- "eval_steps_per_second": 10.095,
165
  "step": 10945
166
  }
167
  ],
 
1
  {
2
+ "best_metric": 0.6021606922149658,
3
  "best_model_checkpoint": "mushrooms_image_detection/checkpoint-10945",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.05,
13
+ "grad_norm": 5.143975734710693,
14
  "learning_rate": 1.9173932996787516e-07,
15
+ "loss": 0.6876,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09,
20
+ "grad_norm": 5.595354080200195,
21
  "learning_rate": 1.825608077099587e-07,
22
+ "loss": 0.705,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14,
27
+ "grad_norm": 8.542109489440918,
28
  "learning_rate": 1.733822854520422e-07,
29
+ "loss": 0.6908,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.18,
34
+ "grad_norm": 5.49858283996582,
35
  "learning_rate": 1.6420376319412576e-07,
36
+ "loss": 0.6763,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.23,
41
+ "grad_norm": 5.070239067077637,
42
  "learning_rate": 1.5502524093620926e-07,
43
+ "loss": 0.6807,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.27,
48
+ "grad_norm": 3.0705084800720215,
49
  "learning_rate": 1.458467186782928e-07,
50
+ "loss": 0.6879,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.32,
55
+ "grad_norm": 3.836571455001831,
56
  "learning_rate": 1.366681964203763e-07,
57
+ "loss": 0.69,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.37,
62
+ "grad_norm": 7.066412448883057,
63
  "learning_rate": 1.2748967416245983e-07,
64
+ "loss": 0.6808,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.41,
69
+ "grad_norm": 5.1906328201293945,
70
  "learning_rate": 1.1831115190454337e-07,
71
+ "loss": 0.6842,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.46,
76
+ "grad_norm": 6.5265703201293945,
77
  "learning_rate": 1.0913262964662688e-07,
78
+ "loss": 0.6911,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.5,
83
+ "grad_norm": 8.26229190826416,
84
  "learning_rate": 9.995410738871042e-08,
85
+ "loss": 0.6743,
86
  "step": 5500
87
  },
88
  {
89
  "epoch": 0.55,
90
+ "grad_norm": 5.895538330078125,
91
  "learning_rate": 9.077558513079394e-08,
92
+ "loss": 0.6734,
93
  "step": 6000
94
  },
95
  {
96
  "epoch": 0.59,
97
+ "grad_norm": 9.030574798583984,
98
  "learning_rate": 8.159706287287747e-08,
99
+ "loss": 0.6718,
100
  "step": 6500
101
  },
102
  {
103
  "epoch": 0.64,
104
+ "grad_norm": 7.243845462799072,
105
  "learning_rate": 7.241854061496099e-08,
106
+ "loss": 0.6698,
107
  "step": 7000
108
  },
109
  {
110
  "epoch": 0.69,
111
+ "grad_norm": 5.422345161437988,
112
  "learning_rate": 6.32400183570445e-08,
113
+ "loss": 0.6627,
114
  "step": 7500
115
  },
116
  {
117
  "epoch": 0.73,
118
+ "grad_norm": 3.86919903755188,
119
  "learning_rate": 5.406149609912804e-08,
120
+ "loss": 0.667,
121
  "step": 8000
122
  },
123
  {
124
  "epoch": 0.78,
125
+ "grad_norm": 8.272964477539062,
126
  "learning_rate": 4.488297384121156e-08,
127
+ "loss": 0.6542,
128
  "step": 8500
129
  },
130
  {
131
  "epoch": 0.82,
132
+ "grad_norm": 7.44323205947876,
133
  "learning_rate": 3.5704451583295086e-08,
134
+ "loss": 0.6729,
135
  "step": 9000
136
  },
137
  {
138
  "epoch": 0.87,
139
+ "grad_norm": 3.3304898738861084,
140
  "learning_rate": 2.6525929325378617e-08,
141
+ "loss": 0.6822,
142
  "step": 9500
143
  },
144
  {
145
  "epoch": 0.91,
146
+ "grad_norm": 7.638361930847168,
147
  "learning_rate": 1.7347407067462138e-08,
148
+ "loss": 0.6749,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 0.96,
153
+ "grad_norm": 4.384842395782471,
154
  "learning_rate": 8.168884809545663e-09,
155
+ "loss": 0.6733,
156
  "step": 10500
157
  },
158
  {
159
  "epoch": 1.0,
160
+ "eval_accuracy": 0.8896693506938496,
161
+ "eval_loss": 0.6021606922149658,
162
+ "eval_runtime": 3122.8795,
163
+ "eval_samples_per_second": 74.764,
164
+ "eval_steps_per_second": 9.346,
165
  "step": 10945
166
  }
167
  ],
config.json CHANGED
@@ -224,5 +224,5 @@
224
  "problem_type": "single_label_classification",
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
- "transformers_version": "4.39.2"
228
  }
 
224
  "problem_type": "single_label_classification",
225
  "qkv_bias": true,
226
  "torch_dtype": "float32",
227
+ "transformers_version": "4.39.3"
228
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccf47aecf2a5fe3fd2c3f2724fbbfb6295e0d057bb189850fbdf7f05b8d977d3
3
  size 343525432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6df9d6bd9f12074fbbeba04adf05e42f2d5b750360625482975e711cacae747a
3
  size 343525432