Joshua Lochner committed on
Commit
e3dc3e6
1 Parent(s): bbff979

Add `detr-resnet-50-panoptic` for image-segmentation

Browse files

NOTE: This is actually the unquantized model, because the quantized model is very inaccurate. However, given the way the library currently works, I can't specify that the unquantized version should be used by default, so it is stored under the `quantized/` path.

quantized/facebook/detr-resnet-50-panoptic/image-segmentation/config.json ADDED
@@ -0,0 +1,550 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_commit_hash": "060ed34a4a3501c5e8a328c69862871c2e242016",
3
+ "_name_or_path": "facebook/detr-resnet-50-panoptic",
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "relu",
6
+ "architectures": [
7
+ "DetrForSegmentation"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "auxiliary_loss": false,
11
+ "backbone": "resnet50",
12
+ "backbone_config": null,
13
+ "bbox_cost": 5,
14
+ "bbox_loss_coefficient": 5,
15
+ "class_cost": 1,
16
+ "classifier_dropout": 0.0,
17
+ "d_model": 256,
18
+ "decoder_attention_heads": 8,
19
+ "decoder_ffn_dim": 2048,
20
+ "decoder_layerdrop": 0.0,
21
+ "decoder_layers": 6,
22
+ "dice_loss_coefficient": 1,
23
+ "dilation": false,
24
+ "dropout": 0.1,
25
+ "encoder_attention_heads": 8,
26
+ "encoder_ffn_dim": 2048,
27
+ "encoder_layerdrop": 0.0,
28
+ "encoder_layers": 6,
29
+ "eos_coefficient": 0.1,
30
+ "giou_cost": 2,
31
+ "giou_loss_coefficient": 2,
32
+ "id2label": {
33
+ "0": "N/A",
34
+ "1": "person",
35
+ "2": "bicycle",
36
+ "3": "car",
37
+ "4": "motorcycle",
38
+ "5": "airplane",
39
+ "6": "bus",
40
+ "7": "train",
41
+ "8": "truck",
42
+ "9": "boat",
43
+ "10": "traffic light",
44
+ "11": "fire hydrant",
45
+ "12": "street sign",
46
+ "13": "stop sign",
47
+ "14": "parking meter",
48
+ "15": "bench",
49
+ "16": "bird",
50
+ "17": "cat",
51
+ "18": "dog",
52
+ "19": "horse",
53
+ "20": "sheep",
54
+ "21": "cow",
55
+ "22": "elephant",
56
+ "23": "bear",
57
+ "24": "zebra",
58
+ "25": "giraffe",
59
+ "26": "hat",
60
+ "27": "backpack",
61
+ "28": "umbrella",
62
+ "29": "shoe",
63
+ "30": "eye glasses",
64
+ "31": "handbag",
65
+ "32": "tie",
66
+ "33": "suitcase",
67
+ "34": "frisbee",
68
+ "35": "skis",
69
+ "36": "snowboard",
70
+ "37": "sports ball",
71
+ "38": "kite",
72
+ "39": "baseball bat",
73
+ "40": "baseball glove",
74
+ "41": "skateboard",
75
+ "42": "surfboard",
76
+ "43": "tennis racket",
77
+ "44": "bottle",
78
+ "45": "plate",
79
+ "46": "wine glass",
80
+ "47": "cup",
81
+ "48": "fork",
82
+ "49": "knife",
83
+ "50": "spoon",
84
+ "51": "bowl",
85
+ "52": "banana",
86
+ "53": "apple",
87
+ "54": "sandwich",
88
+ "55": "orange",
89
+ "56": "broccoli",
90
+ "57": "carrot",
91
+ "58": "hot dog",
92
+ "59": "pizza",
93
+ "60": "donut",
94
+ "61": "cake",
95
+ "62": "chair",
96
+ "63": "couch",
97
+ "64": "potted plant",
98
+ "65": "bed",
99
+ "66": "mirror",
100
+ "67": "dining table",
101
+ "68": "window",
102
+ "69": "desk",
103
+ "70": "toilet",
104
+ "71": "door",
105
+ "72": "tv",
106
+ "73": "laptop",
107
+ "74": "mouse",
108
+ "75": "remote",
109
+ "76": "keyboard",
110
+ "77": "cell phone",
111
+ "78": "microwave",
112
+ "79": "oven",
113
+ "80": "toaster",
114
+ "81": "sink",
115
+ "82": "refrigerator",
116
+ "83": "blender",
117
+ "84": "book",
118
+ "85": "clock",
119
+ "86": "vase",
120
+ "87": "scissors",
121
+ "88": "teddy bear",
122
+ "89": "hair drier",
123
+ "90": "toothbrush",
124
+ "91": "hair brush",
125
+ "92": "banner",
126
+ "93": "blanket",
127
+ "94": "branch",
128
+ "95": "bridge",
129
+ "96": "building-other",
130
+ "97": "bush",
131
+ "98": "cabinet",
132
+ "99": "cage",
133
+ "100": "cardboard",
134
+ "101": "carpet",
135
+ "102": "ceiling-other",
136
+ "103": "ceiling-tile",
137
+ "104": "cloth",
138
+ "105": "clothes",
139
+ "106": "clouds",
140
+ "107": "counter",
141
+ "108": "cupboard",
142
+ "109": "curtain",
143
+ "110": "desk-stuff",
144
+ "111": "dirt",
145
+ "112": "door-stuff",
146
+ "113": "fence",
147
+ "114": "floor-marble",
148
+ "115": "floor-other",
149
+ "116": "floor-stone",
150
+ "117": "floor-tile",
151
+ "118": "floor-wood",
152
+ "119": "flower",
153
+ "120": "fog",
154
+ "121": "food-other",
155
+ "122": "fruit",
156
+ "123": "furniture-other",
157
+ "124": "grass",
158
+ "125": "gravel",
159
+ "126": "ground-other",
160
+ "127": "hill",
161
+ "128": "house",
162
+ "129": "leaves",
163
+ "130": "light",
164
+ "131": "mat",
165
+ "132": "metal",
166
+ "133": "mirror-stuff",
167
+ "134": "moss",
168
+ "135": "mountain",
169
+ "136": "mud",
170
+ "137": "napkin",
171
+ "138": "net",
172
+ "139": "paper",
173
+ "140": "pavement",
174
+ "141": "pillow",
175
+ "142": "plant-other",
176
+ "143": "plastic",
177
+ "144": "platform",
178
+ "145": "playingfield",
179
+ "146": "railing",
180
+ "147": "railroad",
181
+ "148": "river",
182
+ "149": "road",
183
+ "150": "rock",
184
+ "151": "roof",
185
+ "152": "rug",
186
+ "153": "salad",
187
+ "154": "sand",
188
+ "155": "sea",
189
+ "156": "shelf",
190
+ "157": "sky-other",
191
+ "158": "skyscraper",
192
+ "159": "snow",
193
+ "160": "solid-other",
194
+ "161": "stairs",
195
+ "162": "stone",
196
+ "163": "straw",
197
+ "164": "structural-other",
198
+ "165": "table",
199
+ "166": "tent",
200
+ "167": "textile-other",
201
+ "168": "towel",
202
+ "169": "tree",
203
+ "170": "vegetable",
204
+ "171": "wall-brick",
205
+ "172": "wall-concrete",
206
+ "173": "wall-other",
207
+ "174": "wall-panel",
208
+ "175": "wall-stone",
209
+ "176": "wall-tile",
210
+ "177": "wall-wood",
211
+ "178": "water-other",
212
+ "179": "waterdrops",
213
+ "180": "window-blind",
214
+ "181": "window-other",
215
+ "182": "wood",
216
+ "183": "LABEL_183",
217
+ "184": "LABEL_184",
218
+ "185": "LABEL_185",
219
+ "186": "LABEL_186",
220
+ "187": "LABEL_187",
221
+ "188": "LABEL_188",
222
+ "189": "LABEL_189",
223
+ "190": "LABEL_190",
224
+ "191": "LABEL_191",
225
+ "192": "LABEL_192",
226
+ "193": "LABEL_193",
227
+ "194": "LABEL_194",
228
+ "195": "LABEL_195",
229
+ "196": "LABEL_196",
230
+ "197": "LABEL_197",
231
+ "198": "LABEL_198",
232
+ "199": "LABEL_199",
233
+ "200": "LABEL_200",
234
+ "201": "LABEL_201",
235
+ "202": "LABEL_202",
236
+ "203": "LABEL_203",
237
+ "204": "LABEL_204",
238
+ "205": "LABEL_205",
239
+ "206": "LABEL_206",
240
+ "207": "LABEL_207",
241
+ "208": "LABEL_208",
242
+ "209": "LABEL_209",
243
+ "210": "LABEL_210",
244
+ "211": "LABEL_211",
245
+ "212": "LABEL_212",
246
+ "213": "LABEL_213",
247
+ "214": "LABEL_214",
248
+ "215": "LABEL_215",
249
+ "216": "LABEL_216",
250
+ "217": "LABEL_217",
251
+ "218": "LABEL_218",
252
+ "219": "LABEL_219",
253
+ "220": "LABEL_220",
254
+ "221": "LABEL_221",
255
+ "222": "LABEL_222",
256
+ "223": "LABEL_223",
257
+ "224": "LABEL_224",
258
+ "225": "LABEL_225",
259
+ "226": "LABEL_226",
260
+ "227": "LABEL_227",
261
+ "228": "LABEL_228",
262
+ "229": "LABEL_229",
263
+ "230": "LABEL_230",
264
+ "231": "LABEL_231",
265
+ "232": "LABEL_232",
266
+ "233": "LABEL_233",
267
+ "234": "LABEL_234",
268
+ "235": "LABEL_235",
269
+ "236": "LABEL_236",
270
+ "237": "LABEL_237",
271
+ "238": "LABEL_238",
272
+ "239": "LABEL_239",
273
+ "240": "LABEL_240",
274
+ "241": "LABEL_241",
275
+ "242": "LABEL_242",
276
+ "243": "LABEL_243",
277
+ "244": "LABEL_244",
278
+ "245": "LABEL_245",
279
+ "246": "LABEL_246",
280
+ "247": "LABEL_247",
281
+ "248": "LABEL_248",
282
+ "249": "LABEL_249"
283
+ },
284
+ "init_std": 0.02,
285
+ "init_xavier_std": 1.0,
286
+ "is_encoder_decoder": true,
287
+ "label2id": {
288
+ "LABEL_183": 183,
289
+ "LABEL_184": 184,
290
+ "LABEL_185": 185,
291
+ "LABEL_186": 186,
292
+ "LABEL_187": 187,
293
+ "LABEL_188": 188,
294
+ "LABEL_189": 189,
295
+ "LABEL_190": 190,
296
+ "LABEL_191": 191,
297
+ "LABEL_192": 192,
298
+ "LABEL_193": 193,
299
+ "LABEL_194": 194,
300
+ "LABEL_195": 195,
301
+ "LABEL_196": 196,
302
+ "LABEL_197": 197,
303
+ "LABEL_198": 198,
304
+ "LABEL_199": 199,
305
+ "LABEL_200": 200,
306
+ "LABEL_201": 201,
307
+ "LABEL_202": 202,
308
+ "LABEL_203": 203,
309
+ "LABEL_204": 204,
310
+ "LABEL_205": 205,
311
+ "LABEL_206": 206,
312
+ "LABEL_207": 207,
313
+ "LABEL_208": 208,
314
+ "LABEL_209": 209,
315
+ "LABEL_210": 210,
316
+ "LABEL_211": 211,
317
+ "LABEL_212": 212,
318
+ "LABEL_213": 213,
319
+ "LABEL_214": 214,
320
+ "LABEL_215": 215,
321
+ "LABEL_216": 216,
322
+ "LABEL_217": 217,
323
+ "LABEL_218": 218,
324
+ "LABEL_219": 219,
325
+ "LABEL_220": 220,
326
+ "LABEL_221": 221,
327
+ "LABEL_222": 222,
328
+ "LABEL_223": 223,
329
+ "LABEL_224": 224,
330
+ "LABEL_225": 225,
331
+ "LABEL_226": 226,
332
+ "LABEL_227": 227,
333
+ "LABEL_228": 228,
334
+ "LABEL_229": 229,
335
+ "LABEL_230": 230,
336
+ "LABEL_231": 231,
337
+ "LABEL_232": 232,
338
+ "LABEL_233": 233,
339
+ "LABEL_234": 234,
340
+ "LABEL_235": 235,
341
+ "LABEL_236": 236,
342
+ "LABEL_237": 237,
343
+ "LABEL_238": 238,
344
+ "LABEL_239": 239,
345
+ "LABEL_240": 240,
346
+ "LABEL_241": 241,
347
+ "LABEL_242": 242,
348
+ "LABEL_243": 243,
349
+ "LABEL_244": 244,
350
+ "LABEL_245": 245,
351
+ "LABEL_246": 246,
352
+ "LABEL_247": 247,
353
+ "LABEL_248": 248,
354
+ "LABEL_249": 249,
355
+ "N/A": 0,
356
+ "airplane": 5,
357
+ "apple": 53,
358
+ "backpack": 27,
359
+ "banana": 52,
360
+ "banner": 92,
361
+ "baseball bat": 39,
362
+ "baseball glove": 40,
363
+ "bear": 23,
364
+ "bed": 65,
365
+ "bench": 15,
366
+ "bicycle": 2,
367
+ "bird": 16,
368
+ "blanket": 93,
369
+ "blender": 83,
370
+ "boat": 9,
371
+ "book": 84,
372
+ "bottle": 44,
373
+ "bowl": 51,
374
+ "branch": 94,
375
+ "bridge": 95,
376
+ "broccoli": 56,
377
+ "building-other": 96,
378
+ "bus": 6,
379
+ "bush": 97,
380
+ "cabinet": 98,
381
+ "cage": 99,
382
+ "cake": 61,
383
+ "car": 3,
384
+ "cardboard": 100,
385
+ "carpet": 101,
386
+ "carrot": 57,
387
+ "cat": 17,
388
+ "ceiling-other": 102,
389
+ "ceiling-tile": 103,
390
+ "cell phone": 77,
391
+ "chair": 62,
392
+ "clock": 85,
393
+ "cloth": 104,
394
+ "clothes": 105,
395
+ "clouds": 106,
396
+ "couch": 63,
397
+ "counter": 107,
398
+ "cow": 21,
399
+ "cup": 47,
400
+ "cupboard": 108,
401
+ "curtain": 109,
402
+ "desk": 69,
403
+ "desk-stuff": 110,
404
+ "dining table": 67,
405
+ "dirt": 111,
406
+ "dog": 18,
407
+ "donut": 60,
408
+ "door": 71,
409
+ "door-stuff": 112,
410
+ "elephant": 22,
411
+ "eye glasses": 30,
412
+ "fence": 113,
413
+ "fire hydrant": 11,
414
+ "floor-marble": 114,
415
+ "floor-other": 115,
416
+ "floor-stone": 116,
417
+ "floor-tile": 117,
418
+ "floor-wood": 118,
419
+ "flower": 119,
420
+ "fog": 120,
421
+ "food-other": 121,
422
+ "fork": 48,
423
+ "frisbee": 34,
424
+ "fruit": 122,
425
+ "furniture-other": 123,
426
+ "giraffe": 25,
427
+ "grass": 124,
428
+ "gravel": 125,
429
+ "ground-other": 126,
430
+ "hair brush": 91,
431
+ "hair drier": 89,
432
+ "handbag": 31,
433
+ "hat": 26,
434
+ "hill": 127,
435
+ "horse": 19,
436
+ "hot dog": 58,
437
+ "house": 128,
438
+ "keyboard": 76,
439
+ "kite": 38,
440
+ "knife": 49,
441
+ "laptop": 73,
442
+ "leaves": 129,
443
+ "light": 130,
444
+ "mat": 131,
445
+ "metal": 132,
446
+ "microwave": 78,
447
+ "mirror": 66,
448
+ "mirror-stuff": 133,
449
+ "moss": 134,
450
+ "motorcycle": 4,
451
+ "mountain": 135,
452
+ "mouse": 74,
453
+ "mud": 136,
454
+ "napkin": 137,
455
+ "net": 138,
456
+ "orange": 55,
457
+ "oven": 79,
458
+ "paper": 139,
459
+ "parking meter": 14,
460
+ "pavement": 140,
461
+ "person": 1,
462
+ "pillow": 141,
463
+ "pizza": 59,
464
+ "plant-other": 142,
465
+ "plastic": 143,
466
+ "plate": 45,
467
+ "platform": 144,
468
+ "playingfield": 145,
469
+ "potted plant": 64,
470
+ "railing": 146,
471
+ "railroad": 147,
472
+ "refrigerator": 82,
473
+ "remote": 75,
474
+ "river": 148,
475
+ "road": 149,
476
+ "rock": 150,
477
+ "roof": 151,
478
+ "rug": 152,
479
+ "salad": 153,
480
+ "sand": 154,
481
+ "sandwich": 54,
482
+ "scissors": 87,
483
+ "sea": 155,
484
+ "sheep": 20,
485
+ "shelf": 156,
486
+ "shoe": 29,
487
+ "sink": 81,
488
+ "skateboard": 41,
489
+ "skis": 35,
490
+ "sky-other": 157,
491
+ "skyscraper": 158,
492
+ "snow": 159,
493
+ "snowboard": 36,
494
+ "solid-other": 160,
495
+ "spoon": 50,
496
+ "sports ball": 37,
497
+ "stairs": 161,
498
+ "stone": 162,
499
+ "stop sign": 13,
500
+ "straw": 163,
501
+ "street sign": 12,
502
+ "structural-other": 164,
503
+ "suitcase": 33,
504
+ "surfboard": 42,
505
+ "table": 165,
506
+ "teddy bear": 88,
507
+ "tennis racket": 43,
508
+ "tent": 166,
509
+ "textile-other": 167,
510
+ "tie": 32,
511
+ "toaster": 80,
512
+ "toilet": 70,
513
+ "toothbrush": 90,
514
+ "towel": 168,
515
+ "traffic light": 10,
516
+ "train": 7,
517
+ "tree": 169,
518
+ "truck": 8,
519
+ "tv": 72,
520
+ "umbrella": 28,
521
+ "vase": 86,
522
+ "vegetable": 170,
523
+ "wall-brick": 171,
524
+ "wall-concrete": 172,
525
+ "wall-other": 173,
526
+ "wall-panel": 174,
527
+ "wall-stone": 175,
528
+ "wall-tile": 176,
529
+ "wall-wood": 177,
530
+ "water-other": 178,
531
+ "waterdrops": 179,
532
+ "window": 68,
533
+ "window-blind": 180,
534
+ "window-other": 181,
535
+ "wine glass": 46,
536
+ "wood": 182,
537
+ "zebra": 24
538
+ },
539
+ "mask_loss_coefficient": 1,
540
+ "max_position_embeddings": 1024,
541
+ "model_type": "detr",
542
+ "num_channels": 3,
543
+ "num_hidden_layers": 6,
544
+ "num_queries": 100,
545
+ "position_embedding_type": "sine",
546
+ "scale_embedding": false,
547
+ "transformers_version": "4.7.0.dev0",
548
+ "use_pretrained_backbone": true,
549
+ "use_timm_backbone": true
550
+ }
quantized/facebook/detr-resnet-50-panoptic/image-segmentation/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca23bd2f604c3866222e658b7c239660fad4abd77e72b1027c6e80d339db09c6
3
+ size 172282718
quantized/facebook/detr-resnet-50-panoptic/image-segmentation/preprocessor_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_resize": true,
4
+ "feature_extractor_type": "DetrFeatureExtractor",
5
+ "format": "coco_panoptic",
6
+ "image_mean": [
7
+ 0.485,
8
+ 0.456,
9
+ 0.406
10
+ ],
11
+ "image_std": [
12
+ 0.229,
13
+ 0.224,
14
+ 0.225
15
+ ],
16
+ "max_size": 1333,
17
+ "size": 800
18
+ }