s1lv3rj1nx committed on
Commit
2982c17
1 Parent(s): c6a80c2

Upload mask_rcnn_X_101_32x8d_FPN_3x.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. mask_rcnn_X_101_32x8d_FPN_3x.yml +309 -0
mask_rcnn_X_101_32x8d_FPN_3x.yml ADDED
@@ -0,0 +1,309 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CUDNN_BENCHMARK: false
2
+ DATALOADER:
3
+ ASPECT_RATIO_GROUPING: true
4
+ FILTER_EMPTY_ANNOTATIONS: true
5
+ NUM_WORKERS: 4
6
+ REPEAT_THRESHOLD: 0.0
7
+ SAMPLER_TRAIN: TrainingSampler
8
+ DATASETS:
9
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
10
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
11
+ PROPOSAL_FILES_TEST: []
12
+ PROPOSAL_FILES_TRAIN: []
13
+ TEST:
14
+ - publaynet-val
15
+ TRAIN:
16
+ - publaynet-train
17
+ GLOBAL:
18
+ HACK: 1.0
19
+ INPUT:
20
+ CROP:
21
+ ENABLED: false
22
+ SIZE:
23
+ - 0.9
24
+ - 0.9
25
+ TYPE: relative_range
26
+ FORMAT: BGR
27
+ MASK_FORMAT: polygon
28
+ MAX_SIZE_TEST: 1333
29
+ MAX_SIZE_TRAIN: 1333
30
+ MIN_SIZE_TEST: 800
31
+ MIN_SIZE_TRAIN:
32
+ - 640
33
+ - 672
34
+ - 704
35
+ - 736
36
+ - 768
37
+ - 800
38
+ MIN_SIZE_TRAIN_SAMPLING: choice
39
+ MODEL:
40
+ ANCHOR_GENERATOR:
41
+ ANGLES:
42
+ - - -90
43
+ - 0
44
+ - 90
45
+ ASPECT_RATIOS:
46
+ - - 0.5
47
+ - 1.0
48
+ - 2.0
49
+ NAME: DefaultAnchorGenerator
50
+ OFFSET: 0.0
51
+ SIZES:
52
+ - - 32
53
+ - - 64
54
+ - - 128
55
+ - - 256
56
+ - - 512
57
+ BACKBONE:
58
+ FREEZE_AT: 2
59
+ NAME: build_resnet_fpn_backbone
60
+ DEVICE: cuda
61
+ FPN:
62
+ FUSE_TYPE: sum
63
+ IN_FEATURES:
64
+ - res2
65
+ - res3
66
+ - res4
67
+ - res5
68
+ NORM: ""
69
+ OUT_CHANNELS: 256
70
+ KEYPOINT_ON: false
71
+ LOAD_PROPOSALS: false
72
+ MASK_ON: true
73
+ META_ARCHITECTURE: GeneralizedRCNN
74
+ PANOPTIC_FPN:
75
+ COMBINE:
76
+ ENABLED: true
77
+ INSTANCES_CONFIDENCE_THRESH: 0.5
78
+ OVERLAP_THRESH: 0.5
79
+ STUFF_AREA_LIMIT: 4096
80
+ INSTANCE_LOSS_WEIGHT: 1.0
81
+ PIXEL_MEAN:
82
+ - 103.53
83
+ - 116.28
84
+ - 123.675
85
+ PIXEL_STD:
86
+ - 57.375
87
+ - 57.12
88
+ - 58.395
89
+ PROPOSAL_GENERATOR:
90
+ MIN_SIZE: 0
91
+ NAME: RPN
92
+ RESNETS:
93
+ DEFORM_MODULATED: false
94
+ DEFORM_NUM_GROUPS: 1
95
+ DEFORM_ON_PER_STAGE:
96
+ - false
97
+ - false
98
+ - false
99
+ - false
100
+ DEPTH: 101
101
+ NORM: FrozenBN
102
+ NUM_GROUPS: 32
103
+ OUT_FEATURES:
104
+ - res2
105
+ - res3
106
+ - res4
107
+ - res5
108
+ RES2_OUT_CHANNELS: 256
109
+ RES5_DILATION: 1
110
+ STEM_OUT_CHANNELS: 64
111
+ STRIDE_IN_1X1: false
112
+ WIDTH_PER_GROUP: 8
113
+ RETINANET:
114
+ BBOX_REG_WEIGHTS:
115
+ - 1.0
116
+ - 1.0
117
+ - 1.0
118
+ - 1.0
119
+ FOCAL_LOSS_ALPHA: 0.25
120
+ FOCAL_LOSS_GAMMA: 2.0
121
+ IN_FEATURES:
122
+ - p3
123
+ - p4
124
+ - p5
125
+ - p6
126
+ - p7
127
+ IOU_LABELS:
128
+ - 0
129
+ - -1
130
+ - 1
131
+ IOU_THRESHOLDS:
132
+ - 0.4
133
+ - 0.5
134
+ NMS_THRESH_TEST: 0.5
135
+ NUM_CLASSES: 80
136
+ NUM_CONVS: 4
137
+ PRIOR_PROB: 0.01
138
+ SCORE_THRESH_TEST: 0.05
139
+ SMOOTH_L1_LOSS_BETA: 0.1
140
+ TOPK_CANDIDATES_TEST: 1000
141
+ ROI_BOX_CASCADE_HEAD:
142
+ BBOX_REG_WEIGHTS:
143
+ - - 10.0
144
+ - 10.0
145
+ - 5.0
146
+ - 5.0
147
+ - - 20.0
148
+ - 20.0
149
+ - 10.0
150
+ - 10.0
151
+ - - 30.0
152
+ - 30.0
153
+ - 15.0
154
+ - 15.0
155
+ IOUS:
156
+ - 0.5
157
+ - 0.6
158
+ - 0.7
159
+ ROI_BOX_HEAD:
160
+ BBOX_REG_WEIGHTS:
161
+ - 10.0
162
+ - 10.0
163
+ - 5.0
164
+ - 5.0
165
+ CLS_AGNOSTIC_BBOX_REG: false
166
+ CONV_DIM: 256
167
+ FC_DIM: 1024
168
+ NAME: FastRCNNConvFCHead
169
+ NORM: ""
170
+ NUM_CONV: 0
171
+ NUM_FC: 2
172
+ POOLER_RESOLUTION: 7
173
+ POOLER_SAMPLING_RATIO: 0
174
+ POOLER_TYPE: ROIAlignV2
175
+ SMOOTH_L1_BETA: 0.0
176
+ TRAIN_ON_PRED_BOXES: false
177
+ ROI_HEADS:
178
+ BATCH_SIZE_PER_IMAGE: 512
179
+ IN_FEATURES:
180
+ - p2
181
+ - p3
182
+ - p4
183
+ - p5
184
+ IOU_LABELS:
185
+ - 0
186
+ - 1
187
+ IOU_THRESHOLDS:
188
+ - 0.5
189
+ NAME: StandardROIHeads
190
+ NMS_THRESH_TEST: 0.5
191
+ NUM_CLASSES: 5
192
+ POSITIVE_FRACTION: 0.25
193
+ PROPOSAL_APPEND_GT: true
194
+ SCORE_THRESH_TEST: 0.05
195
+ ROI_KEYPOINT_HEAD:
196
+ CONV_DIMS:
197
+ - 512
198
+ - 512
199
+ - 512
200
+ - 512
201
+ - 512
202
+ - 512
203
+ - 512
204
+ - 512
205
+ LOSS_WEIGHT: 1.0
206
+ MIN_KEYPOINTS_PER_IMAGE: 1
207
+ NAME: KRCNNConvDeconvUpsampleHead
208
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
209
+ NUM_KEYPOINTS: 17
210
+ POOLER_RESOLUTION: 14
211
+ POOLER_SAMPLING_RATIO: 0
212
+ POOLER_TYPE: ROIAlignV2
213
+ ROI_MASK_HEAD:
214
+ CLS_AGNOSTIC_MASK: false
215
+ CONV_DIM: 256
216
+ NAME: MaskRCNNConvUpsampleHead
217
+ NORM: ""
218
+ NUM_CONV: 4
219
+ POOLER_RESOLUTION: 14
220
+ POOLER_SAMPLING_RATIO: 0
221
+ POOLER_TYPE: ROIAlignV2
222
+ RPN:
223
+ BATCH_SIZE_PER_IMAGE: 256
224
+ BBOX_REG_WEIGHTS:
225
+ - 1.0
226
+ - 1.0
227
+ - 1.0
228
+ - 1.0
229
+ BOUNDARY_THRESH: -1
230
+ HEAD_NAME: StandardRPNHead
231
+ IN_FEATURES:
232
+ - p2
233
+ - p3
234
+ - p4
235
+ - p5
236
+ - p6
237
+ IOU_LABELS:
238
+ - 0
239
+ - -1
240
+ - 1
241
+ IOU_THRESHOLDS:
242
+ - 0.3
243
+ - 0.7
244
+ LOSS_WEIGHT: 1.0
245
+ NMS_THRESH: 0.7
246
+ POSITIVE_FRACTION: 0.5
247
+ POST_NMS_TOPK_TEST: 1000
248
+ POST_NMS_TOPK_TRAIN: 1000
249
+ PRE_NMS_TOPK_TEST: 1000
250
+ PRE_NMS_TOPK_TRAIN: 2000
251
+ SMOOTH_L1_BETA: 0.0
252
+ SEM_SEG_HEAD:
253
+ COMMON_STRIDE: 4
254
+ CONVS_DIM: 128
255
+ IGNORE_VALUE: 255
256
+ IN_FEATURES:
257
+ - p2
258
+ - p3
259
+ - p4
260
+ - p5
261
+ LOSS_WEIGHT: 1.0
262
+ NAME: SemSegFPNHead
263
+ NORM: GN
264
+ NUM_CLASSES: 54
265
+ WEIGHTS: https://www.dropbox.com/s/57zjbwv6gh3srry/model_final.pth?dl=1
266
+ OUTPUT_DIR: ../outputs/publaynet/mask_rcnn_X_101_32x8d_FPN_3x/
267
+ SEED: -1
268
+ SOLVER:
269
+ BASE_LR: 0.0005
270
+ BIAS_LR_FACTOR: 1.0
271
+ CHECKPOINT_PERIOD: 60000
272
+ GAMMA: 0.1
273
+ IMS_PER_BATCH: 2
274
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
275
+ MAX_ITER: 180000
276
+ MOMENTUM: 0.9
277
+ STEPS:
278
+ - 210000
279
+ - 250000
280
+ WARMUP_FACTOR: 0.001
281
+ WARMUP_ITERS: 1000
282
+ WARMUP_METHOD: linear
283
+ WEIGHT_DECAY: 0.0001
284
+ WEIGHT_DECAY_BIAS: 0.0001
285
+ WEIGHT_DECAY_NORM: 0.0
286
+ TEST:
287
+ AUG:
288
+ ENABLED: false
289
+ FLIP: true
290
+ MAX_SIZE: 4000
291
+ MIN_SIZES:
292
+ - 400
293
+ - 500
294
+ - 600
295
+ - 700
296
+ - 800
297
+ - 900
298
+ - 1000
299
+ - 1100
300
+ - 1200
301
+ DETECTIONS_PER_IMAGE: 100
302
+ EVAL_PERIOD: 0
303
+ EXPECTED_RESULTS: []
304
+ KEYPOINT_OKS_SIGMAS: []
305
+ PRECISE_BN:
306
+ ENABLED: false
307
+ NUM_ITER: 200
308
+ VERSION: 2
309
+ VIS_PERIOD: 0