dima806 commited on
Commit
c9fce04
1 Parent(s): 90948b7

Upload folder using huggingface_hub

Browse files
checkpoint-11400/config.json ADDED
@@ -0,0 +1,330 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-base-patch16-224-in21k",
3
+ "architectures": [
4
+ "ViTForImageClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "encoder_stride": 16,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.0,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "acinonyx-jubatus",
13
+ "1": "aethia-cristatella",
14
+ "2": "agalychnis-callidryas",
15
+ "3": "agkistrodon-contortrix",
16
+ "4": "ailuropoda-melanoleuca",
17
+ "5": "ailurus-fulgens",
18
+ "6": "alces-alces",
19
+ "7": "anas-platyrhynchos",
20
+ "8": "ankylosaurus-magniventris",
21
+ "9": "apis-mellifera",
22
+ "10": "aptenodytes-forsteri",
23
+ "11": "aquila-chrysaetos",
24
+ "12": "ara-macao",
25
+ "13": "architeuthis-dux",
26
+ "14": "ardea-herodias",
27
+ "15": "balaenoptera-musculus",
28
+ "16": "betta-splendens",
29
+ "17": "bison-bison",
30
+ "18": "bos-gaurus",
31
+ "19": "bos-taurus",
32
+ "20": "bradypus-variegatus",
33
+ "21": "branta-canadensis",
34
+ "22": "canis-lupus",
35
+ "23": "canis-lupus-familiaris",
36
+ "24": "carcharodon-carcharias",
37
+ "25": "cardinalis-cardinalis",
38
+ "26": "cathartes-aura",
39
+ "27": "centrochelys-sulcata",
40
+ "28": "centruroides-vittatus",
41
+ "29": "ceratitis-capitata",
42
+ "30": "ceratotherium-simum",
43
+ "31": "chelonia-mydas",
44
+ "32": "chrysemys-picta",
45
+ "33": "circus-hudsonius",
46
+ "34": "codium-fragile",
47
+ "35": "coelacanthiformes",
48
+ "36": "colaptes-auratus",
49
+ "37": "connochaetes-gnou",
50
+ "38": "correlophus-ciliatus",
51
+ "39": "crocodylus-niloticus",
52
+ "40": "crotalus-atrox",
53
+ "41": "crotophaga-sulcirostris",
54
+ "42": "cryptoprocta-ferox",
55
+ "43": "cyanocitta-cristata",
56
+ "44": "danaus-plexippus",
57
+ "45": "dasypus-novemcinctus",
58
+ "46": "delphinapterus-leucas",
59
+ "47": "dendrobatidae",
60
+ "48": "dermochelys-coriacea",
61
+ "49": "desmodus-rotundus",
62
+ "50": "diplodocus",
63
+ "51": "dugong-dugon",
64
+ "52": "eidolon-helvum",
65
+ "53": "enhydra-lutris",
66
+ "54": "enteroctopus-dofleini",
67
+ "55": "equus-caballus",
68
+ "56": "equus-quagga",
69
+ "57": "eudocimus-albus",
70
+ "58": "eunectes-murinus",
71
+ "59": "falco-peregrinus",
72
+ "60": "felis-catus",
73
+ "61": "formicidae",
74
+ "62": "gallus-gallus-domesticus",
75
+ "63": "gavialis-gangeticus",
76
+ "64": "geococcyx-californianus",
77
+ "65": "giraffa-camelopardalis",
78
+ "66": "gorilla-gorilla",
79
+ "67": "haliaeetus-leucocephalus",
80
+ "68": "hapalochlaena-maculosa",
81
+ "69": "heloderma-suspectum",
82
+ "70": "heterocera",
83
+ "71": "hippopotamus-amphibius",
84
+ "72": "homo-sapiens",
85
+ "73": "hydrurga-leptonyx",
86
+ "74": "icterus-galbula",
87
+ "75": "icterus-gularis",
88
+ "76": "icterus-spurius",
89
+ "77": "iguana-iguana",
90
+ "78": "iguanodon-bernissartensis",
91
+ "79": "inia-geoffrensis",
92
+ "80": "lampropeltis-triangulum",
93
+ "81": "lemur-catta",
94
+ "82": "lepus-americanus",
95
+ "83": "loxodonta-africana",
96
+ "84": "macropus-giganteus",
97
+ "85": "malayopython-reticulatus",
98
+ "86": "mammuthus-primigeniu",
99
+ "87": "martes-americana",
100
+ "88": "megaptera-novaeangliae",
101
+ "89": "melanerpes-carolinus",
102
+ "90": "mellisuga-helenae",
103
+ "91": "mergus-serrator",
104
+ "92": "mimus-polyglottos",
105
+ "93": "monodon-monoceros",
106
+ "94": "musca-domestica",
107
+ "95": "odobenus-rosmarus",
108
+ "96": "okapia-johnstoni",
109
+ "97": "ophiophagus-hannah",
110
+ "98": "orcinus-orca",
111
+ "99": "ornithorhynchus-anatinus",
112
+ "100": "ovis-aries",
113
+ "101": "ovis-canadensis",
114
+ "102": "panthera-leo",
115
+ "103": "panthera-onca",
116
+ "104": "panthera-pardus",
117
+ "105": "panthera-tigris",
118
+ "106": "pantherophis-alleghaniensis",
119
+ "107": "pantherophis-guttatus",
120
+ "108": "papilio-glaucus",
121
+ "109": "passerina-ciris",
122
+ "110": "pavo-cristatus",
123
+ "111": "periplaneta-americana",
124
+ "112": "phascolarctos-cinereus",
125
+ "113": "phoebetria-fusca",
126
+ "114": "phoenicopterus-ruber",
127
+ "115": "phyllobates-terribilis",
128
+ "116": "physalia-physalis",
129
+ "117": "physeter-macrocephalus",
130
+ "118": "poecile-atricapillus",
131
+ "119": "pongo-abelii",
132
+ "120": "procyon-lotor",
133
+ "121": "pteranodon-longiceps",
134
+ "122": "pterois-mombasae",
135
+ "123": "pterois-volitans",
136
+ "124": "puma-concolor",
137
+ "125": "rattus-rattus",
138
+ "126": "rusa-unicolor",
139
+ "127": "salmo-salar",
140
+ "128": "sciurus-carolinensis",
141
+ "129": "smilodon-populator",
142
+ "130": "spheniscus-demersus",
143
+ "131": "sphyrna-mokarran",
144
+ "132": "spinosaurus-aegyptiacus",
145
+ "133": "stegosaurus-stenops",
146
+ "134": "struthio-camelus",
147
+ "135": "tapirus",
148
+ "136": "tarsius-pumilus",
149
+ "137": "taurotragus-oryx",
150
+ "138": "telmatobufo-bullocki",
151
+ "139": "thryothorus-ludovicianus",
152
+ "140": "triceratops-horridus",
153
+ "141": "trilobita",
154
+ "142": "turdus-migratorius",
155
+ "143": "tursiops-truncatus",
156
+ "144": "tyrannosaurus-rex",
157
+ "145": "tyrannus-tyrannus",
158
+ "146": "ursus-arctos-horribilis",
159
+ "147": "ursus-maritimus",
160
+ "148": "varanus-komodoensis",
161
+ "149": "vulpes-vulpes",
162
+ "150": "vultur-gryphus"
163
+ },
164
+ "image_size": 224,
165
+ "initializer_range": 0.02,
166
+ "intermediate_size": 3072,
167
+ "label2id": {
168
+ "acinonyx-jubatus": 0,
169
+ "aethia-cristatella": 1,
170
+ "agalychnis-callidryas": 2,
171
+ "agkistrodon-contortrix": 3,
172
+ "ailuropoda-melanoleuca": 4,
173
+ "ailurus-fulgens": 5,
174
+ "alces-alces": 6,
175
+ "anas-platyrhynchos": 7,
176
+ "ankylosaurus-magniventris": 8,
177
+ "apis-mellifera": 9,
178
+ "aptenodytes-forsteri": 10,
179
+ "aquila-chrysaetos": 11,
180
+ "ara-macao": 12,
181
+ "architeuthis-dux": 13,
182
+ "ardea-herodias": 14,
183
+ "balaenoptera-musculus": 15,
184
+ "betta-splendens": 16,
185
+ "bison-bison": 17,
186
+ "bos-gaurus": 18,
187
+ "bos-taurus": 19,
188
+ "bradypus-variegatus": 20,
189
+ "branta-canadensis": 21,
190
+ "canis-lupus": 22,
191
+ "canis-lupus-familiaris": 23,
192
+ "carcharodon-carcharias": 24,
193
+ "cardinalis-cardinalis": 25,
194
+ "cathartes-aura": 26,
195
+ "centrochelys-sulcata": 27,
196
+ "centruroides-vittatus": 28,
197
+ "ceratitis-capitata": 29,
198
+ "ceratotherium-simum": 30,
199
+ "chelonia-mydas": 31,
200
+ "chrysemys-picta": 32,
201
+ "circus-hudsonius": 33,
202
+ "codium-fragile": 34,
203
+ "coelacanthiformes": 35,
204
+ "colaptes-auratus": 36,
205
+ "connochaetes-gnou": 37,
206
+ "correlophus-ciliatus": 38,
207
+ "crocodylus-niloticus": 39,
208
+ "crotalus-atrox": 40,
209
+ "crotophaga-sulcirostris": 41,
210
+ "cryptoprocta-ferox": 42,
211
+ "cyanocitta-cristata": 43,
212
+ "danaus-plexippus": 44,
213
+ "dasypus-novemcinctus": 45,
214
+ "delphinapterus-leucas": 46,
215
+ "dendrobatidae": 47,
216
+ "dermochelys-coriacea": 48,
217
+ "desmodus-rotundus": 49,
218
+ "diplodocus": 50,
219
+ "dugong-dugon": 51,
220
+ "eidolon-helvum": 52,
221
+ "enhydra-lutris": 53,
222
+ "enteroctopus-dofleini": 54,
223
+ "equus-caballus": 55,
224
+ "equus-quagga": 56,
225
+ "eudocimus-albus": 57,
226
+ "eunectes-murinus": 58,
227
+ "falco-peregrinus": 59,
228
+ "felis-catus": 60,
229
+ "formicidae": 61,
230
+ "gallus-gallus-domesticus": 62,
231
+ "gavialis-gangeticus": 63,
232
+ "geococcyx-californianus": 64,
233
+ "giraffa-camelopardalis": 65,
234
+ "gorilla-gorilla": 66,
235
+ "haliaeetus-leucocephalus": 67,
236
+ "hapalochlaena-maculosa": 68,
237
+ "heloderma-suspectum": 69,
238
+ "heterocera": 70,
239
+ "hippopotamus-amphibius": 71,
240
+ "homo-sapiens": 72,
241
+ "hydrurga-leptonyx": 73,
242
+ "icterus-galbula": 74,
243
+ "icterus-gularis": 75,
244
+ "icterus-spurius": 76,
245
+ "iguana-iguana": 77,
246
+ "iguanodon-bernissartensis": 78,
247
+ "inia-geoffrensis": 79,
248
+ "lampropeltis-triangulum": 80,
249
+ "lemur-catta": 81,
250
+ "lepus-americanus": 82,
251
+ "loxodonta-africana": 83,
252
+ "macropus-giganteus": 84,
253
+ "malayopython-reticulatus": 85,
254
+ "mammuthus-primigeniu": 86,
255
+ "martes-americana": 87,
256
+ "megaptera-novaeangliae": 88,
257
+ "melanerpes-carolinus": 89,
258
+ "mellisuga-helenae": 90,
259
+ "mergus-serrator": 91,
260
+ "mimus-polyglottos": 92,
261
+ "monodon-monoceros": 93,
262
+ "musca-domestica": 94,
263
+ "odobenus-rosmarus": 95,
264
+ "okapia-johnstoni": 96,
265
+ "ophiophagus-hannah": 97,
266
+ "orcinus-orca": 98,
267
+ "ornithorhynchus-anatinus": 99,
268
+ "ovis-aries": 100,
269
+ "ovis-canadensis": 101,
270
+ "panthera-leo": 102,
271
+ "panthera-onca": 103,
272
+ "panthera-pardus": 104,
273
+ "panthera-tigris": 105,
274
+ "pantherophis-alleghaniensis": 106,
275
+ "pantherophis-guttatus": 107,
276
+ "papilio-glaucus": 108,
277
+ "passerina-ciris": 109,
278
+ "pavo-cristatus": 110,
279
+ "periplaneta-americana": 111,
280
+ "phascolarctos-cinereus": 112,
281
+ "phoebetria-fusca": 113,
282
+ "phoenicopterus-ruber": 114,
283
+ "phyllobates-terribilis": 115,
284
+ "physalia-physalis": 116,
285
+ "physeter-macrocephalus": 117,
286
+ "poecile-atricapillus": 118,
287
+ "pongo-abelii": 119,
288
+ "procyon-lotor": 120,
289
+ "pteranodon-longiceps": 121,
290
+ "pterois-mombasae": 122,
291
+ "pterois-volitans": 123,
292
+ "puma-concolor": 124,
293
+ "rattus-rattus": 125,
294
+ "rusa-unicolor": 126,
295
+ "salmo-salar": 127,
296
+ "sciurus-carolinensis": 128,
297
+ "smilodon-populator": 129,
298
+ "spheniscus-demersus": 130,
299
+ "sphyrna-mokarran": 131,
300
+ "spinosaurus-aegyptiacus": 132,
301
+ "stegosaurus-stenops": 133,
302
+ "struthio-camelus": 134,
303
+ "tapirus": 135,
304
+ "tarsius-pumilus": 136,
305
+ "taurotragus-oryx": 137,
306
+ "telmatobufo-bullocki": 138,
307
+ "thryothorus-ludovicianus": 139,
308
+ "triceratops-horridus": 140,
309
+ "trilobita": 141,
310
+ "turdus-migratorius": 142,
311
+ "tursiops-truncatus": 143,
312
+ "tyrannosaurus-rex": 144,
313
+ "tyrannus-tyrannus": 145,
314
+ "ursus-arctos-horribilis": 146,
315
+ "ursus-maritimus": 147,
316
+ "varanus-komodoensis": 148,
317
+ "vulpes-vulpes": 149,
318
+ "vultur-gryphus": 150
319
+ },
320
+ "layer_norm_eps": 1e-12,
321
+ "model_type": "vit",
322
+ "num_attention_heads": 12,
323
+ "num_channels": 3,
324
+ "num_hidden_layers": 12,
325
+ "patch_size": 16,
326
+ "problem_type": "single_label_classification",
327
+ "qkv_bias": true,
328
+ "torch_dtype": "float32",
329
+ "transformers_version": "4.35.2"
330
+ }
checkpoint-11400/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13aed8024f292ca6815f925a9d723e2e91ca1e07d8b9f83ae9a783be58c791de
3
+ size 343682308
checkpoint-11400/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:029148e06c72f483fb776a4e1df2162d6971a6ac34f235c9e2f95963305ad2de
3
+ size 687485061
checkpoint-11400/preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTImageProcessor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 224,
20
+ "width": 224
21
+ }
22
+ }
checkpoint-11400/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7ce370b27413e7d46c5304724ae8628a55e9bf6703c444b59d99482052fef52
3
+ size 14575
checkpoint-11400/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b73593ac40c716498c384e77da995b9fd5edc159612e75b3ca5c428d3d93a40d
3
+ size 627
checkpoint-11400/trainer_state.json ADDED
@@ -0,0 +1,1051 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 1.375998616218567,
3
+ "best_model_checkpoint": "animal_151_types_image_detection/checkpoint-11400",
4
+ "epoch": 100.0,
5
+ "eval_steps": 500,
6
+ "global_step": 11400,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.037527593818984545,
14
+ "eval_loss": 4.962153434753418,
15
+ "eval_runtime": 14.7302,
16
+ "eval_samples_per_second": 123.013,
17
+ "eval_steps_per_second": 3.87,
18
+ "step": 114
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.1335540838852097,
23
+ "eval_loss": 4.885277271270752,
24
+ "eval_runtime": 14.5295,
25
+ "eval_samples_per_second": 124.712,
26
+ "eval_steps_per_second": 3.923,
27
+ "step": 228
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "eval_accuracy": 0.3498896247240618,
32
+ "eval_loss": 4.794714450836182,
33
+ "eval_runtime": 14.7328,
34
+ "eval_samples_per_second": 122.99,
35
+ "eval_steps_per_second": 3.869,
36
+ "step": 342
37
+ },
38
+ {
39
+ "epoch": 4.0,
40
+ "eval_accuracy": 0.576710816777042,
41
+ "eval_loss": 4.702880382537842,
42
+ "eval_runtime": 15.1167,
43
+ "eval_samples_per_second": 119.868,
44
+ "eval_steps_per_second": 3.771,
45
+ "step": 456
46
+ },
47
+ {
48
+ "epoch": 4.39,
49
+ "learning_rate": 4.801762114537446e-06,
50
+ "loss": 4.8462,
51
+ "step": 500
52
+ },
53
+ {
54
+ "epoch": 5.0,
55
+ "eval_accuracy": 0.7400662251655629,
56
+ "eval_loss": 4.61031436920166,
57
+ "eval_runtime": 14.5797,
58
+ "eval_samples_per_second": 124.282,
59
+ "eval_steps_per_second": 3.91,
60
+ "step": 570
61
+ },
62
+ {
63
+ "epoch": 6.0,
64
+ "eval_accuracy": 0.8173289183222958,
65
+ "eval_loss": 4.516598701477051,
66
+ "eval_runtime": 14.6496,
67
+ "eval_samples_per_second": 123.689,
68
+ "eval_steps_per_second": 3.891,
69
+ "step": 684
70
+ },
71
+ {
72
+ "epoch": 7.0,
73
+ "eval_accuracy": 0.8559602649006622,
74
+ "eval_loss": 4.426823616027832,
75
+ "eval_runtime": 14.6782,
76
+ "eval_samples_per_second": 123.448,
77
+ "eval_steps_per_second": 3.883,
78
+ "step": 798
79
+ },
80
+ {
81
+ "epoch": 8.0,
82
+ "eval_accuracy": 0.8846578366445916,
83
+ "eval_loss": 4.338470935821533,
84
+ "eval_runtime": 14.8516,
85
+ "eval_samples_per_second": 122.007,
86
+ "eval_steps_per_second": 3.838,
87
+ "step": 912
88
+ },
89
+ {
90
+ "epoch": 8.77,
91
+ "learning_rate": 4.581497797356828e-06,
92
+ "loss": 4.4139,
93
+ "step": 1000
94
+ },
95
+ {
96
+ "epoch": 9.0,
97
+ "eval_accuracy": 0.8979028697571744,
98
+ "eval_loss": 4.253594875335693,
99
+ "eval_runtime": 14.9472,
100
+ "eval_samples_per_second": 121.226,
101
+ "eval_steps_per_second": 3.813,
102
+ "step": 1026
103
+ },
104
+ {
105
+ "epoch": 10.0,
106
+ "eval_accuracy": 0.9150110375275938,
107
+ "eval_loss": 4.168024063110352,
108
+ "eval_runtime": 14.7122,
109
+ "eval_samples_per_second": 123.163,
110
+ "eval_steps_per_second": 3.874,
111
+ "step": 1140
112
+ },
113
+ {
114
+ "epoch": 11.0,
115
+ "eval_accuracy": 0.9172185430463576,
116
+ "eval_loss": 4.086403846740723,
117
+ "eval_runtime": 14.7431,
118
+ "eval_samples_per_second": 122.905,
119
+ "eval_steps_per_second": 3.866,
120
+ "step": 1254
121
+ },
122
+ {
123
+ "epoch": 12.0,
124
+ "eval_accuracy": 0.9321192052980133,
125
+ "eval_loss": 4.009535789489746,
126
+ "eval_runtime": 14.777,
127
+ "eval_samples_per_second": 122.623,
128
+ "eval_steps_per_second": 3.857,
129
+ "step": 1368
130
+ },
131
+ {
132
+ "epoch": 13.0,
133
+ "eval_accuracy": 0.9398454746136865,
134
+ "eval_loss": 3.932218313217163,
135
+ "eval_runtime": 14.842,
136
+ "eval_samples_per_second": 122.086,
137
+ "eval_steps_per_second": 3.84,
138
+ "step": 1482
139
+ },
140
+ {
141
+ "epoch": 13.16,
142
+ "learning_rate": 4.361233480176212e-06,
143
+ "loss": 4.0075,
144
+ "step": 1500
145
+ },
146
+ {
147
+ "epoch": 14.0,
148
+ "eval_accuracy": 0.9420529801324503,
149
+ "eval_loss": 3.859485149383545,
150
+ "eval_runtime": 14.5871,
151
+ "eval_samples_per_second": 124.219,
152
+ "eval_steps_per_second": 3.908,
153
+ "step": 1596
154
+ },
155
+ {
156
+ "epoch": 15.0,
157
+ "eval_accuracy": 0.9442604856512141,
158
+ "eval_loss": 3.7879128456115723,
159
+ "eval_runtime": 14.6963,
160
+ "eval_samples_per_second": 123.296,
161
+ "eval_steps_per_second": 3.879,
162
+ "step": 1710
163
+ },
164
+ {
165
+ "epoch": 16.0,
166
+ "eval_accuracy": 0.9464679911699779,
167
+ "eval_loss": 3.7172069549560547,
168
+ "eval_runtime": 14.7356,
169
+ "eval_samples_per_second": 122.968,
170
+ "eval_steps_per_second": 3.868,
171
+ "step": 1824
172
+ },
173
+ {
174
+ "epoch": 17.0,
175
+ "eval_accuracy": 0.9481236203090507,
176
+ "eval_loss": 3.6492252349853516,
177
+ "eval_runtime": 20.1559,
178
+ "eval_samples_per_second": 89.899,
179
+ "eval_steps_per_second": 2.828,
180
+ "step": 1938
181
+ },
182
+ {
183
+ "epoch": 17.54,
184
+ "learning_rate": 4.140969162995595e-06,
185
+ "loss": 3.6551,
186
+ "step": 2000
187
+ },
188
+ {
189
+ "epoch": 18.0,
190
+ "eval_accuracy": 0.9503311258278145,
191
+ "eval_loss": 3.5814554691314697,
192
+ "eval_runtime": 17.2491,
193
+ "eval_samples_per_second": 105.049,
194
+ "eval_steps_per_second": 3.305,
195
+ "step": 2052
196
+ },
197
+ {
198
+ "epoch": 19.0,
199
+ "eval_accuracy": 0.9514348785871964,
200
+ "eval_loss": 3.517028331756592,
201
+ "eval_runtime": 14.8364,
202
+ "eval_samples_per_second": 122.132,
203
+ "eval_steps_per_second": 3.842,
204
+ "step": 2166
205
+ },
206
+ {
207
+ "epoch": 20.0,
208
+ "eval_accuracy": 0.9503311258278145,
209
+ "eval_loss": 3.4523494243621826,
210
+ "eval_runtime": 14.9385,
211
+ "eval_samples_per_second": 121.297,
212
+ "eval_steps_per_second": 3.816,
213
+ "step": 2280
214
+ },
215
+ {
216
+ "epoch": 21.0,
217
+ "eval_accuracy": 0.9541942604856513,
218
+ "eval_loss": 3.390517234802246,
219
+ "eval_runtime": 14.7336,
220
+ "eval_samples_per_second": 122.984,
221
+ "eval_steps_per_second": 3.869,
222
+ "step": 2394
223
+ },
224
+ {
225
+ "epoch": 21.93,
226
+ "learning_rate": 3.920704845814978e-06,
227
+ "loss": 3.34,
228
+ "step": 2500
229
+ },
230
+ {
231
+ "epoch": 22.0,
232
+ "eval_accuracy": 0.9558498896247241,
233
+ "eval_loss": 3.3292999267578125,
234
+ "eval_runtime": 14.7422,
235
+ "eval_samples_per_second": 122.913,
236
+ "eval_steps_per_second": 3.866,
237
+ "step": 2508
238
+ },
239
+ {
240
+ "epoch": 23.0,
241
+ "eval_accuracy": 0.9552980132450332,
242
+ "eval_loss": 3.2692325115203857,
243
+ "eval_runtime": 14.916,
244
+ "eval_samples_per_second": 121.48,
245
+ "eval_steps_per_second": 3.821,
246
+ "step": 2622
247
+ },
248
+ {
249
+ "epoch": 24.0,
250
+ "eval_accuracy": 0.9564017660044151,
251
+ "eval_loss": 3.2137107849121094,
252
+ "eval_runtime": 14.7629,
253
+ "eval_samples_per_second": 122.74,
254
+ "eval_steps_per_second": 3.861,
255
+ "step": 2736
256
+ },
257
+ {
258
+ "epoch": 25.0,
259
+ "eval_accuracy": 0.9575055187637969,
260
+ "eval_loss": 3.156517267227173,
261
+ "eval_runtime": 14.7516,
262
+ "eval_samples_per_second": 122.834,
263
+ "eval_steps_per_second": 3.864,
264
+ "step": 2850
265
+ },
266
+ {
267
+ "epoch": 26.0,
268
+ "eval_accuracy": 0.9591611479028698,
269
+ "eval_loss": 3.1020307540893555,
270
+ "eval_runtime": 14.6198,
271
+ "eval_samples_per_second": 123.942,
272
+ "eval_steps_per_second": 3.899,
273
+ "step": 2964
274
+ },
275
+ {
276
+ "epoch": 26.32,
277
+ "learning_rate": 3.7004405286343614e-06,
278
+ "loss": 3.062,
279
+ "step": 3000
280
+ },
281
+ {
282
+ "epoch": 27.0,
283
+ "eval_accuracy": 0.9580573951434879,
284
+ "eval_loss": 3.047849178314209,
285
+ "eval_runtime": 14.747,
286
+ "eval_samples_per_second": 122.872,
287
+ "eval_steps_per_second": 3.865,
288
+ "step": 3078
289
+ },
290
+ {
291
+ "epoch": 28.0,
292
+ "eval_accuracy": 0.9597130242825607,
293
+ "eval_loss": 2.9951817989349365,
294
+ "eval_runtime": 14.6085,
295
+ "eval_samples_per_second": 124.038,
296
+ "eval_steps_per_second": 3.902,
297
+ "step": 3192
298
+ },
299
+ {
300
+ "epoch": 29.0,
301
+ "eval_accuracy": 0.9608167770419426,
302
+ "eval_loss": 2.9445724487304688,
303
+ "eval_runtime": 14.744,
304
+ "eval_samples_per_second": 122.897,
305
+ "eval_steps_per_second": 3.866,
306
+ "step": 3306
307
+ },
308
+ {
309
+ "epoch": 30.0,
310
+ "eval_accuracy": 0.9641280353200883,
311
+ "eval_loss": 2.8922934532165527,
312
+ "eval_runtime": 14.7257,
313
+ "eval_samples_per_second": 123.05,
314
+ "eval_steps_per_second": 3.871,
315
+ "step": 3420
316
+ },
317
+ {
318
+ "epoch": 30.7,
319
+ "learning_rate": 3.4801762114537445e-06,
320
+ "loss": 2.8103,
321
+ "step": 3500
322
+ },
323
+ {
324
+ "epoch": 31.0,
325
+ "eval_accuracy": 0.9635761589403974,
326
+ "eval_loss": 2.8442115783691406,
327
+ "eval_runtime": 14.5837,
328
+ "eval_samples_per_second": 124.248,
329
+ "eval_steps_per_second": 3.908,
330
+ "step": 3534
331
+ },
332
+ {
333
+ "epoch": 32.0,
334
+ "eval_accuracy": 0.9624724061810155,
335
+ "eval_loss": 2.7976019382476807,
336
+ "eval_runtime": 14.8078,
337
+ "eval_samples_per_second": 122.368,
338
+ "eval_steps_per_second": 3.849,
339
+ "step": 3648
340
+ },
341
+ {
342
+ "epoch": 33.0,
343
+ "eval_accuracy": 0.9663355408388521,
344
+ "eval_loss": 2.749441623687744,
345
+ "eval_runtime": 14.8845,
346
+ "eval_samples_per_second": 121.737,
347
+ "eval_steps_per_second": 3.829,
348
+ "step": 3762
349
+ },
350
+ {
351
+ "epoch": 34.0,
352
+ "eval_accuracy": 0.9646799116997793,
353
+ "eval_loss": 2.702268600463867,
354
+ "eval_runtime": 14.6998,
355
+ "eval_samples_per_second": 123.267,
356
+ "eval_steps_per_second": 3.878,
357
+ "step": 3876
358
+ },
359
+ {
360
+ "epoch": 35.0,
361
+ "eval_accuracy": 0.9646799116997793,
362
+ "eval_loss": 2.656121253967285,
363
+ "eval_runtime": 14.9899,
364
+ "eval_samples_per_second": 120.881,
365
+ "eval_steps_per_second": 3.803,
366
+ "step": 3990
367
+ },
368
+ {
369
+ "epoch": 35.09,
370
+ "learning_rate": 3.259911894273128e-06,
371
+ "loss": 2.5826,
372
+ "step": 4000
373
+ },
374
+ {
375
+ "epoch": 36.0,
376
+ "eval_accuracy": 0.9657836644591612,
377
+ "eval_loss": 2.613430976867676,
378
+ "eval_runtime": 14.4375,
379
+ "eval_samples_per_second": 125.507,
380
+ "eval_steps_per_second": 3.948,
381
+ "step": 4104
382
+ },
383
+ {
384
+ "epoch": 37.0,
385
+ "eval_accuracy": 0.9663355408388521,
386
+ "eval_loss": 2.5684773921966553,
387
+ "eval_runtime": 14.8268,
388
+ "eval_samples_per_second": 122.212,
389
+ "eval_steps_per_second": 3.844,
390
+ "step": 4218
391
+ },
392
+ {
393
+ "epoch": 38.0,
394
+ "eval_accuracy": 0.9685430463576159,
395
+ "eval_loss": 2.5256078243255615,
396
+ "eval_runtime": 14.6038,
397
+ "eval_samples_per_second": 124.078,
398
+ "eval_steps_per_second": 3.903,
399
+ "step": 4332
400
+ },
401
+ {
402
+ "epoch": 39.0,
403
+ "eval_accuracy": 0.9696467991169978,
404
+ "eval_loss": 2.4859821796417236,
405
+ "eval_runtime": 14.7498,
406
+ "eval_samples_per_second": 122.849,
407
+ "eval_steps_per_second": 3.864,
408
+ "step": 4446
409
+ },
410
+ {
411
+ "epoch": 39.47,
412
+ "learning_rate": 3.039647577092511e-06,
413
+ "loss": 2.3758,
414
+ "step": 4500
415
+ },
416
+ {
417
+ "epoch": 40.0,
418
+ "eval_accuracy": 0.967439293598234,
419
+ "eval_loss": 2.4448373317718506,
420
+ "eval_runtime": 14.4892,
421
+ "eval_samples_per_second": 125.058,
422
+ "eval_steps_per_second": 3.934,
423
+ "step": 4560
424
+ },
425
+ {
426
+ "epoch": 41.0,
427
+ "eval_accuracy": 0.9707505518763797,
428
+ "eval_loss": 2.4062910079956055,
429
+ "eval_runtime": 14.5027,
430
+ "eval_samples_per_second": 124.943,
431
+ "eval_steps_per_second": 3.93,
432
+ "step": 4674
433
+ },
434
+ {
435
+ "epoch": 42.0,
436
+ "eval_accuracy": 0.9696467991169978,
437
+ "eval_loss": 2.366445302963257,
438
+ "eval_runtime": 14.5967,
439
+ "eval_samples_per_second": 124.138,
440
+ "eval_steps_per_second": 3.905,
441
+ "step": 4788
442
+ },
443
+ {
444
+ "epoch": 43.0,
445
+ "eval_accuracy": 0.9696467991169978,
446
+ "eval_loss": 2.3301877975463867,
447
+ "eval_runtime": 15.4794,
448
+ "eval_samples_per_second": 117.059,
449
+ "eval_steps_per_second": 3.682,
450
+ "step": 4902
451
+ },
452
+ {
453
+ "epoch": 43.86,
454
+ "learning_rate": 2.819383259911895e-06,
455
+ "loss": 2.1901,
456
+ "step": 5000
457
+ },
458
+ {
459
+ "epoch": 44.0,
460
+ "eval_accuracy": 0.9685430463576159,
461
+ "eval_loss": 2.292541980743408,
462
+ "eval_runtime": 14.8646,
463
+ "eval_samples_per_second": 121.9,
464
+ "eval_steps_per_second": 3.835,
465
+ "step": 5016
466
+ },
467
+ {
468
+ "epoch": 45.0,
469
+ "eval_accuracy": 0.9713024282560706,
470
+ "eval_loss": 2.258281707763672,
471
+ "eval_runtime": 14.6506,
472
+ "eval_samples_per_second": 123.681,
473
+ "eval_steps_per_second": 3.891,
474
+ "step": 5130
475
+ },
476
+ {
477
+ "epoch": 46.0,
478
+ "eval_accuracy": 0.9718543046357616,
479
+ "eval_loss": 2.2219057083129883,
480
+ "eval_runtime": 14.6119,
481
+ "eval_samples_per_second": 124.009,
482
+ "eval_steps_per_second": 3.901,
483
+ "step": 5244
484
+ },
485
+ {
486
+ "epoch": 47.0,
487
+ "eval_accuracy": 0.9713024282560706,
488
+ "eval_loss": 2.1887381076812744,
489
+ "eval_runtime": 14.7799,
490
+ "eval_samples_per_second": 122.599,
491
+ "eval_steps_per_second": 3.857,
492
+ "step": 5358
493
+ },
494
+ {
495
+ "epoch": 48.0,
496
+ "eval_accuracy": 0.9724061810154525,
497
+ "eval_loss": 2.15564227104187,
498
+ "eval_runtime": 14.5803,
499
+ "eval_samples_per_second": 124.277,
500
+ "eval_steps_per_second": 3.909,
501
+ "step": 5472
502
+ },
503
+ {
504
+ "epoch": 48.25,
505
+ "learning_rate": 2.599118942731278e-06,
506
+ "loss": 2.0234,
507
+ "step": 5500
508
+ },
509
+ {
510
+ "epoch": 49.0,
511
+ "eval_accuracy": 0.9718543046357616,
512
+ "eval_loss": 2.1227617263793945,
513
+ "eval_runtime": 14.678,
514
+ "eval_samples_per_second": 123.45,
515
+ "eval_steps_per_second": 3.883,
516
+ "step": 5586
517
+ },
518
+ {
519
+ "epoch": 50.0,
520
+ "eval_accuracy": 0.9718543046357616,
521
+ "eval_loss": 2.0911219120025635,
522
+ "eval_runtime": 14.5634,
523
+ "eval_samples_per_second": 124.421,
524
+ "eval_steps_per_second": 3.914,
525
+ "step": 5700
526
+ },
527
+ {
528
+ "epoch": 51.0,
529
+ "eval_accuracy": 0.9718543046357616,
530
+ "eval_loss": 2.058539628982544,
531
+ "eval_runtime": 14.5546,
532
+ "eval_samples_per_second": 124.497,
533
+ "eval_steps_per_second": 3.916,
534
+ "step": 5814
535
+ },
536
+ {
537
+ "epoch": 52.0,
538
+ "eval_accuracy": 0.9724061810154525,
539
+ "eval_loss": 2.030808448791504,
540
+ "eval_runtime": 14.7159,
541
+ "eval_samples_per_second": 123.132,
542
+ "eval_steps_per_second": 3.873,
543
+ "step": 5928
544
+ },
545
+ {
546
+ "epoch": 52.63,
547
+ "learning_rate": 2.378854625550661e-06,
548
+ "loss": 1.876,
549
+ "step": 6000
550
+ },
551
+ {
552
+ "epoch": 53.0,
553
+ "eval_accuracy": 0.9729580573951435,
554
+ "eval_loss": 1.999698281288147,
555
+ "eval_runtime": 14.624,
556
+ "eval_samples_per_second": 123.906,
557
+ "eval_steps_per_second": 3.898,
558
+ "step": 6042
559
+ },
560
+ {
561
+ "epoch": 54.0,
562
+ "eval_accuracy": 0.9729580573951435,
563
+ "eval_loss": 1.9714460372924805,
564
+ "eval_runtime": 14.8384,
565
+ "eval_samples_per_second": 122.116,
566
+ "eval_steps_per_second": 3.841,
567
+ "step": 6156
568
+ },
569
+ {
570
+ "epoch": 55.0,
571
+ "eval_accuracy": 0.9724061810154525,
572
+ "eval_loss": 1.944514274597168,
573
+ "eval_runtime": 14.5863,
574
+ "eval_samples_per_second": 124.226,
575
+ "eval_steps_per_second": 3.908,
576
+ "step": 6270
577
+ },
578
+ {
579
+ "epoch": 56.0,
580
+ "eval_accuracy": 0.9718543046357616,
581
+ "eval_loss": 1.9172853231430054,
582
+ "eval_runtime": 14.6007,
583
+ "eval_samples_per_second": 124.103,
584
+ "eval_steps_per_second": 3.904,
585
+ "step": 6384
586
+ },
587
+ {
588
+ "epoch": 57.0,
589
+ "eval_accuracy": 0.9724061810154525,
590
+ "eval_loss": 1.8919694423675537,
591
+ "eval_runtime": 14.4525,
592
+ "eval_samples_per_second": 125.377,
593
+ "eval_steps_per_second": 3.944,
594
+ "step": 6498
595
+ },
596
+ {
597
+ "epoch": 57.02,
598
+ "learning_rate": 2.1585903083700445e-06,
599
+ "loss": 1.7451,
600
+ "step": 6500
601
+ },
602
+ {
603
+ "epoch": 58.0,
604
+ "eval_accuracy": 0.9740618101545254,
605
+ "eval_loss": 1.8659210205078125,
606
+ "eval_runtime": 14.7567,
607
+ "eval_samples_per_second": 122.791,
608
+ "eval_steps_per_second": 3.863,
609
+ "step": 6612
610
+ },
611
+ {
612
+ "epoch": 59.0,
613
+ "eval_accuracy": 0.9729580573951435,
614
+ "eval_loss": 1.842057704925537,
615
+ "eval_runtime": 14.733,
616
+ "eval_samples_per_second": 122.989,
617
+ "eval_steps_per_second": 3.869,
618
+ "step": 6726
619
+ },
620
+ {
621
+ "epoch": 60.0,
622
+ "eval_accuracy": 0.9746136865342163,
623
+ "eval_loss": 1.8180880546569824,
624
+ "eval_runtime": 14.5204,
625
+ "eval_samples_per_second": 124.79,
626
+ "eval_steps_per_second": 3.926,
627
+ "step": 6840
628
+ },
629
+ {
630
+ "epoch": 61.0,
631
+ "eval_accuracy": 0.9735099337748344,
632
+ "eval_loss": 1.7939091920852661,
633
+ "eval_runtime": 14.6724,
634
+ "eval_samples_per_second": 123.497,
635
+ "eval_steps_per_second": 3.885,
636
+ "step": 6954
637
+ },
638
+ {
639
+ "epoch": 61.4,
640
+ "learning_rate": 1.9383259911894276e-06,
641
+ "loss": 1.6286,
642
+ "step": 7000
643
+ },
644
+ {
645
+ "epoch": 62.0,
646
+ "eval_accuracy": 0.9729580573951435,
647
+ "eval_loss": 1.7723444700241089,
648
+ "eval_runtime": 14.599,
649
+ "eval_samples_per_second": 124.118,
650
+ "eval_steps_per_second": 3.904,
651
+ "step": 7068
652
+ },
653
+ {
654
+ "epoch": 63.0,
655
+ "eval_accuracy": 0.9740618101545254,
656
+ "eval_loss": 1.7489854097366333,
657
+ "eval_runtime": 14.5258,
658
+ "eval_samples_per_second": 124.743,
659
+ "eval_steps_per_second": 3.924,
660
+ "step": 7182
661
+ },
662
+ {
663
+ "epoch": 64.0,
664
+ "eval_accuracy": 0.9757174392935982,
665
+ "eval_loss": 1.7285088300704956,
666
+ "eval_runtime": 14.4828,
667
+ "eval_samples_per_second": 125.114,
668
+ "eval_steps_per_second": 3.936,
669
+ "step": 7296
670
+ },
671
+ {
672
+ "epoch": 65.0,
673
+ "eval_accuracy": 0.9740618101545254,
674
+ "eval_loss": 1.7077668905258179,
675
+ "eval_runtime": 14.7222,
676
+ "eval_samples_per_second": 123.079,
677
+ "eval_steps_per_second": 3.872,
678
+ "step": 7410
679
+ },
680
+ {
681
+ "epoch": 65.79,
682
+ "learning_rate": 1.7180616740088108e-06,
683
+ "loss": 1.5281,
684
+ "step": 7500
685
+ },
686
+ {
687
+ "epoch": 66.0,
688
+ "eval_accuracy": 0.9746136865342163,
689
+ "eval_loss": 1.6885572671890259,
690
+ "eval_runtime": 14.7611,
691
+ "eval_samples_per_second": 122.755,
692
+ "eval_steps_per_second": 3.862,
693
+ "step": 7524
694
+ },
695
+ {
696
+ "epoch": 67.0,
697
+ "eval_accuracy": 0.9740618101545254,
698
+ "eval_loss": 1.6697474718093872,
699
+ "eval_runtime": 14.5138,
700
+ "eval_samples_per_second": 124.846,
701
+ "eval_steps_per_second": 3.927,
702
+ "step": 7638
703
+ },
704
+ {
705
+ "epoch": 68.0,
706
+ "eval_accuracy": 0.9746136865342163,
707
+ "eval_loss": 1.6512248516082764,
708
+ "eval_runtime": 14.4806,
709
+ "eval_samples_per_second": 125.133,
710
+ "eval_steps_per_second": 3.936,
711
+ "step": 7752
712
+ },
713
+ {
714
+ "epoch": 69.0,
715
+ "eval_accuracy": 0.9735099337748344,
716
+ "eval_loss": 1.6349101066589355,
717
+ "eval_runtime": 14.6474,
718
+ "eval_samples_per_second": 123.708,
719
+ "eval_steps_per_second": 3.891,
720
+ "step": 7866
721
+ },
722
+ {
723
+ "epoch": 70.0,
724
+ "eval_accuracy": 0.9729580573951435,
725
+ "eval_loss": 1.6167147159576416,
726
+ "eval_runtime": 14.5436,
727
+ "eval_samples_per_second": 124.591,
728
+ "eval_steps_per_second": 3.919,
729
+ "step": 7980
730
+ },
731
+ {
732
+ "epoch": 70.18,
733
+ "learning_rate": 1.497797356828194e-06,
734
+ "loss": 1.4403,
735
+ "step": 8000
736
+ },
737
+ {
738
+ "epoch": 71.0,
739
+ "eval_accuracy": 0.9729580573951435,
740
+ "eval_loss": 1.600691556930542,
741
+ "eval_runtime": 14.4531,
742
+ "eval_samples_per_second": 125.371,
743
+ "eval_steps_per_second": 3.944,
744
+ "step": 8094
745
+ },
746
+ {
747
+ "epoch": 72.0,
748
+ "eval_accuracy": 0.9746136865342163,
749
+ "eval_loss": 1.5854783058166504,
750
+ "eval_runtime": 14.6051,
751
+ "eval_samples_per_second": 124.067,
752
+ "eval_steps_per_second": 3.903,
753
+ "step": 8208
754
+ },
755
+ {
756
+ "epoch": 73.0,
757
+ "eval_accuracy": 0.9751655629139073,
758
+ "eval_loss": 1.5697646141052246,
759
+ "eval_runtime": 14.7222,
760
+ "eval_samples_per_second": 123.079,
761
+ "eval_steps_per_second": 3.872,
762
+ "step": 8322
763
+ },
764
+ {
765
+ "epoch": 74.0,
766
+ "eval_accuracy": 0.9735099337748344,
767
+ "eval_loss": 1.5558655261993408,
768
+ "eval_runtime": 14.7278,
769
+ "eval_samples_per_second": 123.033,
770
+ "eval_steps_per_second": 3.87,
771
+ "step": 8436
772
+ },
773
+ {
774
+ "epoch": 74.56,
775
+ "learning_rate": 1.2775330396475772e-06,
776
+ "loss": 1.3684,
777
+ "step": 8500
778
+ },
779
+ {
780
+ "epoch": 75.0,
781
+ "eval_accuracy": 0.9746136865342163,
782
+ "eval_loss": 1.5405701398849487,
783
+ "eval_runtime": 14.4937,
784
+ "eval_samples_per_second": 125.02,
785
+ "eval_steps_per_second": 3.933,
786
+ "step": 8550
787
+ },
788
+ {
789
+ "epoch": 76.0,
790
+ "eval_accuracy": 0.9735099337748344,
791
+ "eval_loss": 1.52810537815094,
792
+ "eval_runtime": 14.5545,
793
+ "eval_samples_per_second": 124.497,
794
+ "eval_steps_per_second": 3.916,
795
+ "step": 8664
796
+ },
797
+ {
798
+ "epoch": 77.0,
799
+ "eval_accuracy": 0.9735099337748344,
800
+ "eval_loss": 1.5153011083602905,
801
+ "eval_runtime": 14.6637,
802
+ "eval_samples_per_second": 123.57,
803
+ "eval_steps_per_second": 3.887,
804
+ "step": 8778
805
+ },
806
+ {
807
+ "epoch": 78.0,
808
+ "eval_accuracy": 0.9746136865342163,
809
+ "eval_loss": 1.5028570890426636,
810
+ "eval_runtime": 14.5939,
811
+ "eval_samples_per_second": 124.162,
812
+ "eval_steps_per_second": 3.906,
813
+ "step": 8892
814
+ },
815
+ {
816
+ "epoch": 78.95,
817
+ "learning_rate": 1.0572687224669604e-06,
818
+ "loss": 1.3041,
819
+ "step": 9000
820
+ },
821
+ {
822
+ "epoch": 79.0,
823
+ "eval_accuracy": 0.9740618101545254,
824
+ "eval_loss": 1.4909206628799438,
825
+ "eval_runtime": 14.5501,
826
+ "eval_samples_per_second": 124.535,
827
+ "eval_steps_per_second": 3.918,
828
+ "step": 9006
829
+ },
830
+ {
831
+ "epoch": 80.0,
832
+ "eval_accuracy": 0.9740618101545254,
833
+ "eval_loss": 1.4797635078430176,
834
+ "eval_runtime": 14.5945,
835
+ "eval_samples_per_second": 124.157,
836
+ "eval_steps_per_second": 3.906,
837
+ "step": 9120
838
+ },
839
+ {
840
+ "epoch": 81.0,
841
+ "eval_accuracy": 0.9751655629139073,
842
+ "eval_loss": 1.469772219657898,
843
+ "eval_runtime": 14.868,
844
+ "eval_samples_per_second": 121.873,
845
+ "eval_steps_per_second": 3.834,
846
+ "step": 9234
847
+ },
848
+ {
849
+ "epoch": 82.0,
850
+ "eval_accuracy": 0.9740618101545254,
851
+ "eval_loss": 1.4597550630569458,
852
+ "eval_runtime": 14.5863,
853
+ "eval_samples_per_second": 124.226,
854
+ "eval_steps_per_second": 3.908,
855
+ "step": 9348
856
+ },
857
+ {
858
+ "epoch": 83.0,
859
+ "eval_accuracy": 0.9746136865342163,
860
+ "eval_loss": 1.4507455825805664,
861
+ "eval_runtime": 14.5654,
862
+ "eval_samples_per_second": 124.404,
863
+ "eval_steps_per_second": 3.913,
864
+ "step": 9462
865
+ },
866
+ {
867
+ "epoch": 83.33,
868
+ "learning_rate": 8.370044052863437e-07,
869
+ "loss": 1.2554,
870
+ "step": 9500
871
+ },
872
+ {
873
+ "epoch": 84.0,
874
+ "eval_accuracy": 0.9735099337748344,
875
+ "eval_loss": 1.4420080184936523,
876
+ "eval_runtime": 14.7476,
877
+ "eval_samples_per_second": 122.868,
878
+ "eval_steps_per_second": 3.865,
879
+ "step": 9576
880
+ },
881
+ {
882
+ "epoch": 85.0,
883
+ "eval_accuracy": 0.9740618101545254,
884
+ "eval_loss": 1.433323860168457,
885
+ "eval_runtime": 14.5881,
886
+ "eval_samples_per_second": 124.211,
887
+ "eval_steps_per_second": 3.907,
888
+ "step": 9690
889
+ },
890
+ {
891
+ "epoch": 86.0,
892
+ "eval_accuracy": 0.9740618101545254,
893
+ "eval_loss": 1.4266729354858398,
894
+ "eval_runtime": 14.6204,
895
+ "eval_samples_per_second": 123.937,
896
+ "eval_steps_per_second": 3.899,
897
+ "step": 9804
898
+ },
899
+ {
900
+ "epoch": 87.0,
901
+ "eval_accuracy": 0.9746136865342163,
902
+ "eval_loss": 1.419144630432129,
903
+ "eval_runtime": 14.7023,
904
+ "eval_samples_per_second": 123.246,
905
+ "eval_steps_per_second": 3.877,
906
+ "step": 9918
907
+ },
908
+ {
909
+ "epoch": 87.72,
910
+ "learning_rate": 6.16740088105727e-07,
911
+ "loss": 1.2166,
912
+ "step": 10000
913
+ },
914
+ {
915
+ "epoch": 88.0,
916
+ "eval_accuracy": 0.9746136865342163,
917
+ "eval_loss": 1.41357421875,
918
+ "eval_runtime": 14.7197,
919
+ "eval_samples_per_second": 123.101,
920
+ "eval_steps_per_second": 3.872,
921
+ "step": 10032
922
+ },
923
+ {
924
+ "epoch": 89.0,
925
+ "eval_accuracy": 0.9751655629139073,
926
+ "eval_loss": 1.4069515466690063,
927
+ "eval_runtime": 14.5913,
928
+ "eval_samples_per_second": 124.184,
929
+ "eval_steps_per_second": 3.906,
930
+ "step": 10146
931
+ },
932
+ {
933
+ "epoch": 90.0,
934
+ "eval_accuracy": 0.9751655629139073,
935
+ "eval_loss": 1.4011104106903076,
936
+ "eval_runtime": 14.4858,
937
+ "eval_samples_per_second": 125.088,
938
+ "eval_steps_per_second": 3.935,
939
+ "step": 10260
940
+ },
941
+ {
942
+ "epoch": 91.0,
943
+ "eval_accuracy": 0.9751655629139073,
944
+ "eval_loss": 1.396867036819458,
945
+ "eval_runtime": 14.4869,
946
+ "eval_samples_per_second": 125.079,
947
+ "eval_steps_per_second": 3.935,
948
+ "step": 10374
949
+ },
950
+ {
951
+ "epoch": 92.0,
952
+ "eval_accuracy": 0.9751655629139073,
953
+ "eval_loss": 1.3927924633026123,
954
+ "eval_runtime": 14.9674,
955
+ "eval_samples_per_second": 121.063,
956
+ "eval_steps_per_second": 3.808,
957
+ "step": 10488
958
+ },
959
+ {
960
+ "epoch": 92.11,
961
+ "learning_rate": 3.964757709251102e-07,
962
+ "loss": 1.1885,
963
+ "step": 10500
964
+ },
965
+ {
966
+ "epoch": 93.0,
967
+ "eval_accuracy": 0.9740618101545254,
968
+ "eval_loss": 1.3884556293487549,
969
+ "eval_runtime": 15.051,
970
+ "eval_samples_per_second": 120.39,
971
+ "eval_steps_per_second": 3.787,
972
+ "step": 10602
973
+ },
974
+ {
975
+ "epoch": 94.0,
976
+ "eval_accuracy": 0.9740618101545254,
977
+ "eval_loss": 1.3855311870574951,
978
+ "eval_runtime": 14.5082,
979
+ "eval_samples_per_second": 124.895,
980
+ "eval_steps_per_second": 3.929,
981
+ "step": 10716
982
+ },
983
+ {
984
+ "epoch": 95.0,
985
+ "eval_accuracy": 0.9746136865342163,
986
+ "eval_loss": 1.3824039697647095,
987
+ "eval_runtime": 14.8975,
988
+ "eval_samples_per_second": 121.631,
989
+ "eval_steps_per_second": 3.826,
990
+ "step": 10830
991
+ },
992
+ {
993
+ "epoch": 96.0,
994
+ "eval_accuracy": 0.9746136865342163,
995
+ "eval_loss": 1.3800771236419678,
996
+ "eval_runtime": 14.7571,
997
+ "eval_samples_per_second": 122.788,
998
+ "eval_steps_per_second": 3.863,
999
+ "step": 10944
1000
+ },
1001
+ {
1002
+ "epoch": 96.49,
1003
+ "learning_rate": 1.7621145374449343e-07,
1004
+ "loss": 1.1703,
1005
+ "step": 11000
1006
+ },
1007
+ {
1008
+ "epoch": 97.0,
1009
+ "eval_accuracy": 0.9746136865342163,
1010
+ "eval_loss": 1.378131628036499,
1011
+ "eval_runtime": 14.7894,
1012
+ "eval_samples_per_second": 122.52,
1013
+ "eval_steps_per_second": 3.854,
1014
+ "step": 11058
1015
+ },
1016
+ {
1017
+ "epoch": 98.0,
1018
+ "eval_accuracy": 0.9746136865342163,
1019
+ "eval_loss": 1.3769623041152954,
1020
+ "eval_runtime": 14.5124,
1021
+ "eval_samples_per_second": 124.858,
1022
+ "eval_steps_per_second": 3.928,
1023
+ "step": 11172
1024
+ },
1025
+ {
1026
+ "epoch": 99.0,
1027
+ "eval_accuracy": 0.9746136865342163,
1028
+ "eval_loss": 1.3762928247451782,
1029
+ "eval_runtime": 14.7379,
1030
+ "eval_samples_per_second": 122.948,
1031
+ "eval_steps_per_second": 3.868,
1032
+ "step": 11286
1033
+ },
1034
+ {
1035
+ "epoch": 100.0,
1036
+ "eval_accuracy": 0.9746136865342163,
1037
+ "eval_loss": 1.375998616218567,
1038
+ "eval_runtime": 15.1012,
1039
+ "eval_samples_per_second": 119.991,
1040
+ "eval_steps_per_second": 3.775,
1041
+ "step": 11400
1042
+ }
1043
+ ],
1044
+ "logging_steps": 500,
1045
+ "max_steps": 11400,
1046
+ "num_train_epochs": 100,
1047
+ "save_steps": 500,
1048
+ "total_flos": 5.624120064761856e+19,
1049
+ "trial_name": null,
1050
+ "trial_params": null
1051
+ }
checkpoint-11400/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7e242550be2a583a594f2ba509b483bcf8b85e863a192362f438d02195f34ab
3
+ size 4091
config.json ADDED
@@ -0,0 +1,330 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-base-patch16-224-in21k",
3
+ "architectures": [
4
+ "ViTForImageClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "encoder_stride": 16,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.0,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "acinonyx-jubatus",
13
+ "1": "aethia-cristatella",
14
+ "2": "agalychnis-callidryas",
15
+ "3": "agkistrodon-contortrix",
16
+ "4": "ailuropoda-melanoleuca",
17
+ "5": "ailurus-fulgens",
18
+ "6": "alces-alces",
19
+ "7": "anas-platyrhynchos",
20
+ "8": "ankylosaurus-magniventris",
21
+ "9": "apis-mellifera",
22
+ "10": "aptenodytes-forsteri",
23
+ "11": "aquila-chrysaetos",
24
+ "12": "ara-macao",
25
+ "13": "architeuthis-dux",
26
+ "14": "ardea-herodias",
27
+ "15": "balaenoptera-musculus",
28
+ "16": "betta-splendens",
29
+ "17": "bison-bison",
30
+ "18": "bos-gaurus",
31
+ "19": "bos-taurus",
32
+ "20": "bradypus-variegatus",
33
+ "21": "branta-canadensis",
34
+ "22": "canis-lupus",
35
+ "23": "canis-lupus-familiaris",
36
+ "24": "carcharodon-carcharias",
37
+ "25": "cardinalis-cardinalis",
38
+ "26": "cathartes-aura",
39
+ "27": "centrochelys-sulcata",
40
+ "28": "centruroides-vittatus",
41
+ "29": "ceratitis-capitata",
42
+ "30": "ceratotherium-simum",
43
+ "31": "chelonia-mydas",
44
+ "32": "chrysemys-picta",
45
+ "33": "circus-hudsonius",
46
+ "34": "codium-fragile",
47
+ "35": "coelacanthiformes",
48
+ "36": "colaptes-auratus",
49
+ "37": "connochaetes-gnou",
50
+ "38": "correlophus-ciliatus",
51
+ "39": "crocodylus-niloticus",
52
+ "40": "crotalus-atrox",
53
+ "41": "crotophaga-sulcirostris",
54
+ "42": "cryptoprocta-ferox",
55
+ "43": "cyanocitta-cristata",
56
+ "44": "danaus-plexippus",
57
+ "45": "dasypus-novemcinctus",
58
+ "46": "delphinapterus-leucas",
59
+ "47": "dendrobatidae",
60
+ "48": "dermochelys-coriacea",
61
+ "49": "desmodus-rotundus",
62
+ "50": "diplodocus",
63
+ "51": "dugong-dugon",
64
+ "52": "eidolon-helvum",
65
+ "53": "enhydra-lutris",
66
+ "54": "enteroctopus-dofleini",
67
+ "55": "equus-caballus",
68
+ "56": "equus-quagga",
69
+ "57": "eudocimus-albus",
70
+ "58": "eunectes-murinus",
71
+ "59": "falco-peregrinus",
72
+ "60": "felis-catus",
73
+ "61": "formicidae",
74
+ "62": "gallus-gallus-domesticus",
75
+ "63": "gavialis-gangeticus",
76
+ "64": "geococcyx-californianus",
77
+ "65": "giraffa-camelopardalis",
78
+ "66": "gorilla-gorilla",
79
+ "67": "haliaeetus-leucocephalus",
80
+ "68": "hapalochlaena-maculosa",
81
+ "69": "heloderma-suspectum",
82
+ "70": "heterocera",
83
+ "71": "hippopotamus-amphibius",
84
+ "72": "homo-sapiens",
85
+ "73": "hydrurga-leptonyx",
86
+ "74": "icterus-galbula",
87
+ "75": "icterus-gularis",
88
+ "76": "icterus-spurius",
89
+ "77": "iguana-iguana",
90
+ "78": "iguanodon-bernissartensis",
91
+ "79": "inia-geoffrensis",
92
+ "80": "lampropeltis-triangulum",
93
+ "81": "lemur-catta",
94
+ "82": "lepus-americanus",
95
+ "83": "loxodonta-africana",
96
+ "84": "macropus-giganteus",
97
+ "85": "malayopython-reticulatus",
98
+ "86": "mammuthus-primigeniu",
99
+ "87": "martes-americana",
100
+ "88": "megaptera-novaeangliae",
101
+ "89": "melanerpes-carolinus",
102
+ "90": "mellisuga-helenae",
103
+ "91": "mergus-serrator",
104
+ "92": "mimus-polyglottos",
105
+ "93": "monodon-monoceros",
106
+ "94": "musca-domestica",
107
+ "95": "odobenus-rosmarus",
108
+ "96": "okapia-johnstoni",
109
+ "97": "ophiophagus-hannah",
110
+ "98": "orcinus-orca",
111
+ "99": "ornithorhynchus-anatinus",
112
+ "100": "ovis-aries",
113
+ "101": "ovis-canadensis",
114
+ "102": "panthera-leo",
115
+ "103": "panthera-onca",
116
+ "104": "panthera-pardus",
117
+ "105": "panthera-tigris",
118
+ "106": "pantherophis-alleghaniensis",
119
+ "107": "pantherophis-guttatus",
120
+ "108": "papilio-glaucus",
121
+ "109": "passerina-ciris",
122
+ "110": "pavo-cristatus",
123
+ "111": "periplaneta-americana",
124
+ "112": "phascolarctos-cinereus",
125
+ "113": "phoebetria-fusca",
126
+ "114": "phoenicopterus-ruber",
127
+ "115": "phyllobates-terribilis",
128
+ "116": "physalia-physalis",
129
+ "117": "physeter-macrocephalus",
130
+ "118": "poecile-atricapillus",
131
+ "119": "pongo-abelii",
132
+ "120": "procyon-lotor",
133
+ "121": "pteranodon-longiceps",
134
+ "122": "pterois-mombasae",
135
+ "123": "pterois-volitans",
136
+ "124": "puma-concolor",
137
+ "125": "rattus-rattus",
138
+ "126": "rusa-unicolor",
139
+ "127": "salmo-salar",
140
+ "128": "sciurus-carolinensis",
141
+ "129": "smilodon-populator",
142
+ "130": "spheniscus-demersus",
143
+ "131": "sphyrna-mokarran",
144
+ "132": "spinosaurus-aegyptiacus",
145
+ "133": "stegosaurus-stenops",
146
+ "134": "struthio-camelus",
147
+ "135": "tapirus",
148
+ "136": "tarsius-pumilus",
149
+ "137": "taurotragus-oryx",
150
+ "138": "telmatobufo-bullocki",
151
+ "139": "thryothorus-ludovicianus",
152
+ "140": "triceratops-horridus",
153
+ "141": "trilobita",
154
+ "142": "turdus-migratorius",
155
+ "143": "tursiops-truncatus",
156
+ "144": "tyrannosaurus-rex",
157
+ "145": "tyrannus-tyrannus",
158
+ "146": "ursus-arctos-horribilis",
159
+ "147": "ursus-maritimus",
160
+ "148": "varanus-komodoensis",
161
+ "149": "vulpes-vulpes",
162
+ "150": "vultur-gryphus"
163
+ },
164
+ "image_size": 224,
165
+ "initializer_range": 0.02,
166
+ "intermediate_size": 3072,
167
+ "label2id": {
168
+ "acinonyx-jubatus": 0,
169
+ "aethia-cristatella": 1,
170
+ "agalychnis-callidryas": 2,
171
+ "agkistrodon-contortrix": 3,
172
+ "ailuropoda-melanoleuca": 4,
173
+ "ailurus-fulgens": 5,
174
+ "alces-alces": 6,
175
+ "anas-platyrhynchos": 7,
176
+ "ankylosaurus-magniventris": 8,
177
+ "apis-mellifera": 9,
178
+ "aptenodytes-forsteri": 10,
179
+ "aquila-chrysaetos": 11,
180
+ "ara-macao": 12,
181
+ "architeuthis-dux": 13,
182
+ "ardea-herodias": 14,
183
+ "balaenoptera-musculus": 15,
184
+ "betta-splendens": 16,
185
+ "bison-bison": 17,
186
+ "bos-gaurus": 18,
187
+ "bos-taurus": 19,
188
+ "bradypus-variegatus": 20,
189
+ "branta-canadensis": 21,
190
+ "canis-lupus": 22,
191
+ "canis-lupus-familiaris": 23,
192
+ "carcharodon-carcharias": 24,
193
+ "cardinalis-cardinalis": 25,
194
+ "cathartes-aura": 26,
195
+ "centrochelys-sulcata": 27,
196
+ "centruroides-vittatus": 28,
197
+ "ceratitis-capitata": 29,
198
+ "ceratotherium-simum": 30,
199
+ "chelonia-mydas": 31,
200
+ "chrysemys-picta": 32,
201
+ "circus-hudsonius": 33,
202
+ "codium-fragile": 34,
203
+ "coelacanthiformes": 35,
204
+ "colaptes-auratus": 36,
205
+ "connochaetes-gnou": 37,
206
+ "correlophus-ciliatus": 38,
207
+ "crocodylus-niloticus": 39,
208
+ "crotalus-atrox": 40,
209
+ "crotophaga-sulcirostris": 41,
210
+ "cryptoprocta-ferox": 42,
211
+ "cyanocitta-cristata": 43,
212
+ "danaus-plexippus": 44,
213
+ "dasypus-novemcinctus": 45,
214
+ "delphinapterus-leucas": 46,
215
+ "dendrobatidae": 47,
216
+ "dermochelys-coriacea": 48,
217
+ "desmodus-rotundus": 49,
218
+ "diplodocus": 50,
219
+ "dugong-dugon": 51,
220
+ "eidolon-helvum": 52,
221
+ "enhydra-lutris": 53,
222
+ "enteroctopus-dofleini": 54,
223
+ "equus-caballus": 55,
224
+ "equus-quagga": 56,
225
+ "eudocimus-albus": 57,
226
+ "eunectes-murinus": 58,
227
+ "falco-peregrinus": 59,
228
+ "felis-catus": 60,
229
+ "formicidae": 61,
230
+ "gallus-gallus-domesticus": 62,
231
+ "gavialis-gangeticus": 63,
232
+ "geococcyx-californianus": 64,
233
+ "giraffa-camelopardalis": 65,
234
+ "gorilla-gorilla": 66,
235
+ "haliaeetus-leucocephalus": 67,
236
+ "hapalochlaena-maculosa": 68,
237
+ "heloderma-suspectum": 69,
238
+ "heterocera": 70,
239
+ "hippopotamus-amphibius": 71,
240
+ "homo-sapiens": 72,
241
+ "hydrurga-leptonyx": 73,
242
+ "icterus-galbula": 74,
243
+ "icterus-gularis": 75,
244
+ "icterus-spurius": 76,
245
+ "iguana-iguana": 77,
246
+ "iguanodon-bernissartensis": 78,
247
+ "inia-geoffrensis": 79,
248
+ "lampropeltis-triangulum": 80,
249
+ "lemur-catta": 81,
250
+ "lepus-americanus": 82,
251
+ "loxodonta-africana": 83,
252
+ "macropus-giganteus": 84,
253
+ "malayopython-reticulatus": 85,
254
+ "mammuthus-primigeniu": 86,
255
+ "martes-americana": 87,
256
+ "megaptera-novaeangliae": 88,
257
+ "melanerpes-carolinus": 89,
258
+ "mellisuga-helenae": 90,
259
+ "mergus-serrator": 91,
260
+ "mimus-polyglottos": 92,
261
+ "monodon-monoceros": 93,
262
+ "musca-domestica": 94,
263
+ "odobenus-rosmarus": 95,
264
+ "okapia-johnstoni": 96,
265
+ "ophiophagus-hannah": 97,
266
+ "orcinus-orca": 98,
267
+ "ornithorhynchus-anatinus": 99,
268
+ "ovis-aries": 100,
269
+ "ovis-canadensis": 101,
270
+ "panthera-leo": 102,
271
+ "panthera-onca": 103,
272
+ "panthera-pardus": 104,
273
+ "panthera-tigris": 105,
274
+ "pantherophis-alleghaniensis": 106,
275
+ "pantherophis-guttatus": 107,
276
+ "papilio-glaucus": 108,
277
+ "passerina-ciris": 109,
278
+ "pavo-cristatus": 110,
279
+ "periplaneta-americana": 111,
280
+ "phascolarctos-cinereus": 112,
281
+ "phoebetria-fusca": 113,
282
+ "phoenicopterus-ruber": 114,
283
+ "phyllobates-terribilis": 115,
284
+ "physalia-physalis": 116,
285
+ "physeter-macrocephalus": 117,
286
+ "poecile-atricapillus": 118,
287
+ "pongo-abelii": 119,
288
+ "procyon-lotor": 120,
289
+ "pteranodon-longiceps": 121,
290
+ "pterois-mombasae": 122,
291
+ "pterois-volitans": 123,
292
+ "puma-concolor": 124,
293
+ "rattus-rattus": 125,
294
+ "rusa-unicolor": 126,
295
+ "salmo-salar": 127,
296
+ "sciurus-carolinensis": 128,
297
+ "smilodon-populator": 129,
298
+ "spheniscus-demersus": 130,
299
+ "sphyrna-mokarran": 131,
300
+ "spinosaurus-aegyptiacus": 132,
301
+ "stegosaurus-stenops": 133,
302
+ "struthio-camelus": 134,
303
+ "tapirus": 135,
304
+ "tarsius-pumilus": 136,
305
+ "taurotragus-oryx": 137,
306
+ "telmatobufo-bullocki": 138,
307
+ "thryothorus-ludovicianus": 139,
308
+ "triceratops-horridus": 140,
309
+ "trilobita": 141,
310
+ "turdus-migratorius": 142,
311
+ "tursiops-truncatus": 143,
312
+ "tyrannosaurus-rex": 144,
313
+ "tyrannus-tyrannus": 145,
314
+ "ursus-arctos-horribilis": 146,
315
+ "ursus-maritimus": 147,
316
+ "varanus-komodoensis": 148,
317
+ "vulpes-vulpes": 149,
318
+ "vultur-gryphus": 150
319
+ },
320
+ "layer_norm_eps": 1e-12,
321
+ "model_type": "vit",
322
+ "num_attention_heads": 12,
323
+ "num_channels": 3,
324
+ "num_hidden_layers": 12,
325
+ "patch_size": 16,
326
+ "problem_type": "single_label_classification",
327
+ "qkv_bias": true,
328
+ "torch_dtype": "float32",
329
+ "transformers_version": "4.35.2"
330
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13aed8024f292ca6815f925a9d723e2e91ca1e07d8b9f83ae9a783be58c791de
3
+ size 343682308
preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTImageProcessor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 224,
20
+ "width": 224
21
+ }
22
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7e242550be2a583a594f2ba509b483bcf8b85e863a192362f438d02195f34ab
3
+ size 4091