shubhamWi91 committed on
Commit
524d215
1 Parent(s): 168ef88

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,31 +1,73 @@
1
  {
2
- "_name_or_path": "facebook/detr-resnet-101",
3
  "activation_dropout": 0.0,
4
  "activation_function": "relu",
5
  "architectures": [
6
- "DetrForObjectDetection"
7
  ],
 
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": false,
10
- "backbone": "resnet101",
11
- "backbone_config": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  "bbox_cost": 5,
13
  "bbox_loss_coefficient": 5,
14
  "class_cost": 1,
15
- "classifier_dropout": 0.0,
16
  "d_model": 256,
17
  "decoder_attention_heads": 8,
18
  "decoder_ffn_dim": 2048,
19
  "decoder_layerdrop": 0.0,
20
  "decoder_layers": 6,
 
21
  "dice_loss_coefficient": 1,
22
- "dilation": false,
23
  "dropout": 0.1,
24
  "encoder_attention_heads": 8,
25
  "encoder_ffn_dim": 2048,
26
  "encoder_layerdrop": 0.0,
27
  "encoder_layers": 6,
 
28
  "eos_coefficient": 0.1,
 
29
  "giou_cost": 2,
30
  "giou_loss_coefficient": 2,
31
  "id2label": {
@@ -66,15 +108,14 @@
66
  "tetrapack": 13
67
  },
68
  "mask_loss_coefficient": 1,
69
- "max_position_embeddings": 1024,
70
- "model_type": "detr",
71
- "num_channels": 3,
72
- "num_hidden_layers": 6,
73
- "num_queries": 100,
74
  "position_embedding_type": "sine",
75
- "scale_embedding": false,
76
  "torch_dtype": "float32",
77
  "transformers_version": "4.32.1",
78
- "use_pretrained_backbone": true,
79
- "use_timm_backbone": true
 
80
  }
 
1
  {
2
+ "_name_or_path": "jozhang97/deta-swin-large-o365",
3
  "activation_dropout": 0.0,
4
  "activation_function": "relu",
5
  "architectures": [
6
+ "DetaForObjectDetection"
7
  ],
8
+ "assign_first_stage": true,
9
  "attention_dropout": 0.0,
10
  "auxiliary_loss": false,
11
+ "backbone_config": {
12
+ "attention_probs_dropout_prob": 0.0,
13
+ "depths": [
14
+ 2,
15
+ 2,
16
+ 18,
17
+ 2
18
+ ],
19
+ "drop_path_rate": 0.1,
20
+ "embed_dim": 192,
21
+ "encoder_stride": 32,
22
+ "hidden_act": "gelu",
23
+ "hidden_dropout_prob": 0.0,
24
+ "hidden_size": 1536,
25
+ "image_size": 224,
26
+ "initializer_range": 0.02,
27
+ "layer_norm_eps": 1e-05,
28
+ "mlp_ratio": 4.0,
29
+ "model_type": "swin",
30
+ "num_heads": [
31
+ 6,
32
+ 12,
33
+ 24,
34
+ 48
35
+ ],
36
+ "num_layers": 4,
37
+ "out_features": [
38
+ "stage2",
39
+ "stage3",
40
+ "stage4"
41
+ ],
42
+ "out_indices": [
43
+ 2,
44
+ 3,
45
+ 4
46
+ ],
47
+ "patch_size": 4,
48
+ "path_norm": true,
49
+ "qkv_bias": true,
50
+ "use_absolute_embeddings": false,
51
+ "window_size": 12
52
+ },
53
  "bbox_cost": 5,
54
  "bbox_loss_coefficient": 5,
55
  "class_cost": 1,
 
56
  "d_model": 256,
57
  "decoder_attention_heads": 8,
58
  "decoder_ffn_dim": 2048,
59
  "decoder_layerdrop": 0.0,
60
  "decoder_layers": 6,
61
+ "decoder_n_points": 4,
62
  "dice_loss_coefficient": 1,
 
63
  "dropout": 0.1,
64
  "encoder_attention_heads": 8,
65
  "encoder_ffn_dim": 2048,
66
  "encoder_layerdrop": 0.0,
67
  "encoder_layers": 6,
68
+ "encoder_n_points": 4,
69
  "eos_coefficient": 0.1,
70
+ "focal_alpha": 0.25,
71
  "giou_cost": 2,
72
  "giou_loss_coefficient": 2,
73
  "id2label": {
 
108
  "tetrapack": 13
109
  },
110
  "mask_loss_coefficient": 1,
111
+ "max_position_embeddings": 2048,
112
+ "model_type": "deta",
113
+ "num_feature_levels": 5,
114
+ "num_queries": 900,
 
115
  "position_embedding_type": "sine",
 
116
  "torch_dtype": "float32",
117
  "transformers_version": "4.32.1",
118
+ "two_stage": true,
119
+ "two_stage_num_proposals": 300,
120
+ "with_box_refine": true
121
  }
preprocessor_config.json CHANGED
@@ -9,7 +9,7 @@
9
  0.456,
10
  0.406
11
  ],
12
- "image_processor_type": "DetrImageProcessor",
13
  "image_std": [
14
  0.229,
15
  0.224,
 
9
  0.456,
10
  0.406
11
  ],
12
+ "image_processor_type": "DetaImageProcessor",
13
  "image_std": [
14
  0.229,
15
  0.224,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90b1c82815e35691f33e30d33f305abfacfc78667371f851b58632c3bc2bf4da
3
- size 242896657
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57e210fd0054426a510038426d8cd21c90103942374515cc77977d32261b5a54
3
+ size 878823725
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebcb26d456cb44e53539e99eb331df283870c522bf79e4adfcfed49f50b71c79
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff56f69fa7155045e6f3b027f175f4731b06edd1f187984d2fef18bc986e0fa4
3
  size 4091