gerald29 committed on
Commit
d33ce80
1 Parent(s): 2cf27eb

Training in progress, epoch 0

Browse files
Files changed (4) hide show
  1. config.json +34 -9
  2. model.safetensors +2 -2
  3. preprocessor_config.json +15 -10
  4. training_args.bin +1 -1
config.json CHANGED
@@ -1,10 +1,11 @@
1
  {
2
- "_name_or_path": "google/vit-base-patch16-224-in21k",
 
3
  "architectures": [
4
- "ViTForImageClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.0,
7
- "encoder_stride": 16,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
@@ -111,9 +112,8 @@
111
  "98": "tiramisu",
112
  "99": "tuna_tartare"
113
  },
114
- "image_size": 224,
115
  "initializer_range": 0.02,
116
- "intermediate_size": 3072,
117
  "label2id": {
118
  "apple_pie": "0",
119
  "baby_back_ribs": "1",
@@ -217,14 +217,39 @@
217
  "tuna_tartare": "99",
218
  "waffles": "100"
219
  },
220
- "layer_norm_eps": 1e-12,
221
- "model_type": "vit",
 
 
222
  "num_attention_heads": 12,
223
  "num_channels": 3,
224
  "num_hidden_layers": 12,
225
- "patch_size": 16,
 
 
 
 
 
 
226
  "problem_type": "single_label_classification",
227
  "qkv_bias": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
228
  "torch_dtype": "float32",
229
- "transformers_version": "4.45.2"
 
230
  }
 
1
  {
2
+ "_name_or_path": "facebook/dinov2-base-imagenet1k-1-layer",
3
+ "apply_layernorm": true,
4
  "architectures": [
5
+ "Dinov2ForImageClassification"
6
  ],
7
  "attention_probs_dropout_prob": 0.0,
8
+ "drop_path_rate": 0.0,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.0,
11
  "hidden_size": 768,
 
112
  "98": "tiramisu",
113
  "99": "tuna_tartare"
114
  },
115
+ "image_size": 518,
116
  "initializer_range": 0.02,
 
117
  "label2id": {
118
  "apple_pie": "0",
119
  "baby_back_ribs": "1",
 
217
  "tuna_tartare": "99",
218
  "waffles": "100"
219
  },
220
+ "layer_norm_eps": 1e-06,
221
+ "layerscale_value": 1.0,
222
+ "mlp_ratio": 4,
223
+ "model_type": "dinov2",
224
  "num_attention_heads": 12,
225
  "num_channels": 3,
226
  "num_hidden_layers": 12,
227
+ "out_features": [
228
+ "stage12"
229
+ ],
230
+ "out_indices": [
231
+ 12
232
+ ],
233
+ "patch_size": 14,
234
  "problem_type": "single_label_classification",
235
  "qkv_bias": true,
236
+ "reshape_hidden_states": true,
237
+ "stage_names": [
238
+ "stem",
239
+ "stage1",
240
+ "stage2",
241
+ "stage3",
242
+ "stage4",
243
+ "stage5",
244
+ "stage6",
245
+ "stage7",
246
+ "stage8",
247
+ "stage9",
248
+ "stage10",
249
+ "stage11",
250
+ "stage12"
251
+ ],
252
  "torch_dtype": "float32",
253
+ "transformers_version": "4.45.2",
254
+ "use_swiglu_ffn": false
255
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba2153f16139dfcebfa9c9950983678896b77424af76370894f90b3fe1839a04
3
- size 343528508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05788d610a3673dfd72090b4fa6fa257440732d73dd79e3d2dfab0ad702055a6
3
+ size 346968596
preprocessor_config.json CHANGED
@@ -1,22 +1,27 @@
1
  {
 
 
 
 
 
 
2
  "do_normalize": true,
3
  "do_rescale": true,
4
  "do_resize": true,
5
  "image_mean": [
6
- 0.5,
7
- 0.5,
8
- 0.5
9
  ],
10
- "image_processor_type": "ViTImageProcessor",
11
  "image_std": [
12
- 0.5,
13
- 0.5,
14
- 0.5
15
  ],
16
- "resample": 2,
17
  "rescale_factor": 0.00392156862745098,
18
  "size": {
19
- "height": 224,
20
- "width": 224
21
  }
22
  }
 
1
  {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
  "do_normalize": true,
9
  "do_rescale": true,
10
  "do_resize": true,
11
  "image_mean": [
12
+ 0.485,
13
+ 0.456,
14
+ 0.406
15
  ],
16
+ "image_processor_type": "BitImageProcessor",
17
  "image_std": [
18
+ 0.229,
19
+ 0.224,
20
+ 0.225
21
  ],
22
+ "resample": 3,
23
  "rescale_factor": 0.00392156862745098,
24
  "size": {
25
+ "shortest_edge": 256
 
26
  }
27
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a7eca98acfaf2eeb6c6ef33572fe57afbfb453c99f19e123ddda209efef149f
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c671a5fcbe7d16d79076cb4878b8410ccb68849472fbe6b6c0a22edf7d53fabb
3
  size 5240