nathanReitinger committed on
Commit
75315df
1 Parent(s): b00b9f1

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,13 +1,8 @@
1
  {
2
- "_name_or_path": "google/vit-huge-patch14-224-in21k",
3
  "architectures": [
4
- "ViTForImageClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.0,
7
- "encoder_stride": 16,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.0,
10
- "hidden_size": 1280,
11
  "id2label": {
12
  "0": "T - shirt / top",
13
  "1": "Trouser",
@@ -20,9 +15,7 @@
20
  "8": "Bag",
21
  "9": "Ankle boot"
22
  },
23
- "image_size": 224,
24
- "initializer_range": 0.02,
25
- "intermediate_size": 5120,
26
  "label2id": {
27
  "Ankle boot": "9",
28
  "Bag": "8",
@@ -35,14 +28,28 @@
35
  "T - shirt / top": "0",
36
  "Trouser": "1"
37
  },
38
- "layer_norm_eps": 1e-12,
39
- "model_type": "vit",
40
- "num_attention_heads": 16,
41
- "num_channels": 3,
42
- "num_hidden_layers": 32,
43
- "patch_size": 14,
44
  "problem_type": "single_label_classification",
45
- "qkv_bias": true,
 
 
 
 
 
 
 
 
46
  "torch_dtype": "float32",
47
- "transformers_version": "4.40.1"
 
 
 
 
 
 
 
 
 
 
48
  }
 
1
  {
2
+ "_name_or_path": "openai/clip-vit-large-patch14",
3
  "architectures": [
4
+ "CLIPForImageClassification"
5
  ],
 
 
 
 
 
6
  "id2label": {
7
  "0": "T - shirt / top",
8
  "1": "Trouser",
 
15
  "8": "Bag",
16
  "9": "Ankle boot"
17
  },
18
+ "initializer_factor": 1.0,
 
 
19
  "label2id": {
20
  "Ankle boot": "9",
21
  "Bag": "8",
 
28
  "T - shirt / top": "0",
29
  "Trouser": "1"
30
  },
31
+ "logit_scale_init_value": 2.6592,
32
+ "model_type": "clip",
 
 
 
 
33
  "problem_type": "single_label_classification",
34
+ "projection_dim": 768,
35
+ "text_config": {
36
+ "dropout": 0.0,
37
+ "hidden_size": 768,
38
+ "intermediate_size": 3072,
39
+ "model_type": "clip_text_model",
40
+ "num_attention_heads": 12,
41
+ "projection_dim": 768
42
+ },
43
  "torch_dtype": "float32",
44
+ "transformers_version": "4.40.1",
45
+ "vision_config": {
46
+ "dropout": 0.0,
47
+ "hidden_size": 1024,
48
+ "intermediate_size": 4096,
49
+ "model_type": "clip_vision_model",
50
+ "num_attention_heads": 16,
51
+ "num_hidden_layers": 24,
52
+ "patch_size": 14,
53
+ "projection_dim": 768
54
+ }
55
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba03e37f14b905521bd0492ec29cc1cc4c5f68a441e08575c43823990eed48d8
3
- size 2523172784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b17376300f470619db67a6d721eb61e1cc5bb9dfa3d74b514bcf431143c8a29
3
+ size 1212808056
preprocessor_config.json CHANGED
@@ -4,33 +4,41 @@
4
  "do_resize",
5
  "size",
6
  "resample",
 
 
7
  "do_rescale",
8
  "rescale_factor",
9
  "do_normalize",
10
  "image_mean",
11
  "image_std",
 
12
  "return_tensors",
13
  "data_format",
14
  "input_data_format"
15
  ],
 
 
 
 
 
 
16
  "do_normalize": true,
17
  "do_rescale": true,
18
  "do_resize": true,
19
  "image_mean": [
20
- 0.5,
21
- 0.5,
22
- 0.5
23
  ],
24
- "image_processor_type": "ViTImageProcessor",
25
  "image_std": [
26
- 0.5,
27
- 0.5,
28
- 0.5
29
  ],
30
- "resample": 2,
31
  "rescale_factor": 0.00392156862745098,
32
  "size": {
33
- "height": 224,
34
- "width": 224
35
  }
36
  }
 
4
  "do_resize",
5
  "size",
6
  "resample",
7
+ "do_center_crop",
8
+ "crop_size",
9
  "do_rescale",
10
  "rescale_factor",
11
  "do_normalize",
12
  "image_mean",
13
  "image_std",
14
+ "do_convert_rgb",
15
  "return_tensors",
16
  "data_format",
17
  "input_data_format"
18
  ],
19
+ "crop_size": {
20
+ "height": 224,
21
+ "width": 224
22
+ },
23
+ "do_center_crop": true,
24
+ "do_convert_rgb": true,
25
  "do_normalize": true,
26
  "do_rescale": true,
27
  "do_resize": true,
28
  "image_mean": [
29
+ 0.48145466,
30
+ 0.4578275,
31
+ 0.40821073
32
  ],
33
+ "image_processor_type": "CLIPImageProcessor",
34
  "image_std": [
35
+ 0.26862954,
36
+ 0.26130258,
37
+ 0.27577711
38
  ],
39
+ "resample": 3,
40
  "rescale_factor": 0.00392156862745098,
41
  "size": {
42
+ "shortest_edge": 224
 
43
  }
44
  }
runs/May04_00-26-56_tron60.umiacs.umd.edu/events.out.tfevents.1714796818.tron60.umiacs.umd.edu.188383.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b41e905342b4a52f7a25128670d3efc797ca080c68db2b1f9bfaae1f9fcf41be
3
+ size 13675
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f8793ffc32dbae6f2b33dad465b4561a1516d90336345731faae32e44945f9e
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:686189be16b394f2cea6dd364d97575f2d95d1c28a54e0f3e8e71a052d6952f8
3
  size 5048