EduardoPacheco committed on
Commit
59cc2b0
1 Parent(s): 06fa2e0

Upload GroundingDinoForObjectDetection

Browse files
Files changed (2) hide show
  1. config.json +26 -15
  2. model.safetensors +3 -0
config.json CHANGED
@@ -2,18 +2,28 @@
2
  "activation_dropout": 0.0,
3
  "activation_function": "relu",
4
  "architectures": [
5
- "GroundingDINOForObjectDetection"
6
  ],
7
  "attention_dropout": 0.0,
8
  "auxiliary_loss": false,
9
- "backbone": "swin",
10
  "backbone_config": {
 
11
  "depths": [
12
  2,
13
  2,
14
  6,
15
  2
16
  ],
 
 
 
 
 
 
 
 
 
 
17
  "model_type": "swin",
18
  "num_heads": [
19
  3,
@@ -21,6 +31,7 @@
21
  12,
22
  24
23
  ],
 
24
  "out_features": [
25
  "stage2",
26
  "stage3",
@@ -30,18 +41,21 @@
30
  2,
31
  3,
32
  4
33
- ]
 
 
 
 
34
  },
35
- "bbox_cost": 5,
36
- "bbox_loss_coefficient": 5,
37
- "class_cost": 1,
38
  "d_model": 256,
39
  "decoder_attention_heads": 8,
40
  "decoder_bbox_embed_share": true,
41
  "decoder_ffn_dim": 2048,
42
  "decoder_layers": 6,
43
  "decoder_n_points": 4,
44
- "dilation": false,
45
  "disable_custom_kernels": false,
46
  "dropout": 0.1,
47
  "embedding_init_target": true,
@@ -52,12 +66,12 @@
52
  "focal_alpha": 0.25,
53
  "fusion_dropout": 0.0,
54
  "fusion_droppath": 0.1,
55
- "giou_cost": 2,
56
- "giou_loss_coefficient": 2,
 
57
  "is_encoder_decoder": true,
58
  "max_text_len": 256,
59
  "model_type": "grounding-dino",
60
- "num_channels": 3,
61
  "num_feature_levels": 4,
62
  "num_queries": 900,
63
  "position_embedding_type": "sine",
@@ -68,10 +82,7 @@
68
  },
69
  "text_enhancer_dropout": 0.0,
70
  "torch_dtype": "float32",
71
- "transformers_version": "4.35.0.dev0",
72
  "two_stage": true,
73
- "two_stage_bbox_embed_share": false,
74
- "use_pretrained_backbone": true,
75
- "use_timm_backbone": false,
76
- "with_box_refine": true
77
  }
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "relu",
4
  "architectures": [
5
+ "GroundingDinoForObjectDetection"
6
  ],
7
  "attention_dropout": 0.0,
8
  "auxiliary_loss": false,
 
9
  "backbone_config": {
10
+ "attention_probs_dropout_prob": 0.0,
11
  "depths": [
12
  2,
13
  2,
14
  6,
15
  2
16
  ],
17
+ "drop_path_rate": 0.1,
18
+ "embed_dim": 96,
19
+ "encoder_stride": 32,
20
+ "hidden_act": "gelu",
21
+ "hidden_dropout_prob": 0.0,
22
+ "hidden_size": 768,
23
+ "image_size": 224,
24
+ "initializer_range": 0.02,
25
+ "layer_norm_eps": 1e-05,
26
+ "mlp_ratio": 4.0,
27
  "model_type": "swin",
28
  "num_heads": [
29
  3,
 
31
  12,
32
  24
33
  ],
34
+ "num_layers": 4,
35
  "out_features": [
36
  "stage2",
37
  "stage3",
 
41
  2,
42
  3,
43
  4
44
+ ],
45
+ "patch_size": 4,
46
+ "qkv_bias": true,
47
+ "use_absolute_embeddings": false,
48
+ "window_size": 7
49
  },
50
+ "bbox_cost": 5.0,
51
+ "bbox_loss_coefficient": 5.0,
52
+ "class_cost": 1.0,
53
  "d_model": 256,
54
  "decoder_attention_heads": 8,
55
  "decoder_bbox_embed_share": true,
56
  "decoder_ffn_dim": 2048,
57
  "decoder_layers": 6,
58
  "decoder_n_points": 4,
 
59
  "disable_custom_kernels": false,
60
  "dropout": 0.1,
61
  "embedding_init_target": true,
 
66
  "focal_alpha": 0.25,
67
  "fusion_dropout": 0.0,
68
  "fusion_droppath": 0.1,
69
+ "giou_cost": 2.0,
70
+ "giou_loss_coefficient": 2.0,
71
+ "init_std": 0.02,
72
  "is_encoder_decoder": true,
73
  "max_text_len": 256,
74
  "model_type": "grounding-dino",
 
75
  "num_feature_levels": 4,
76
  "num_queries": 900,
77
  "position_embedding_type": "sine",
 
82
  },
83
  "text_enhancer_dropout": 0.0,
84
  "torch_dtype": "float32",
85
+ "transformers_version": "4.36.0.dev0",
86
  "two_stage": true,
87
+ "two_stage_bbox_embed_share": false
 
 
 
88
  }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1519d39d48a5409cd53831a5ca73397224834a0f76ecd4a9f51630012d4f9af8
3
+ size 691712888