Xenova HF staff committed on
Commit
322a488
1 Parent(s): 358f2f2

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -11,7 +11,7 @@
11
  "prompt_encoder_config": {
12
  "model_type": ""
13
  },
14
- "transformers_version": "4.36.2",
15
  "vision_config": {
16
  "hidden_size": 168,
17
  "mlp_dim": 696,
 
11
  "prompt_encoder_config": {
12
  "model_type": ""
13
  },
14
+ "transformers_version": "4.37.2",
15
  "vision_config": {
16
  "hidden_size": 168,
17
  "mlp_dim": 696,
onnx/prompt_encoder_mask_decoder.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4514391764fbd56e08e119060d874ecd7d52994bfb1968af159e12d4943b5bb
3
- size 16557892
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4c26d6cada5bb9fc394237450ad166f006e3e64eab97238d73b1a91846206a
3
+ size 16640335
onnx/prompt_encoder_mask_decoder_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb90b279f549d2cab7fd6e20c38522438c65d84bdcca3d2a764cff7d857fdce2
3
- size 4903810
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e95d495de5db3bd02d303c525b3003287c6df3d231c7b358559a5520c96fd372
3
+ size 5020129
onnx/vision_encoder.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f8433273a6750b587779baa0cf5508111001bf7e7acfcf585d370139fd366d0
3
- size 23276014
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24bd98fd8e375b257aed9550ef2b25bf026004bdf1e233bfc15d0475c627441f
3
+ size 23275998
onnx/vision_encoder_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cce23c7b2e5d4f330932738fb67ba518e04b0d99ccdd1cccd22a7da4e01f2971
3
- size 8882165
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a1cbc7db99bec8baa85ec2368c72230e75dc17b664ecec539e6fbbd8aa1ab28
3
+ size 8882149
preprocessor_config.json CHANGED
@@ -15,6 +15,13 @@
15
  0.224,
16
  0.225
17
  ],
 
 
 
 
 
 
 
18
  "pad_size": {
19
  "height": 1024,
20
  "width": 1024
 
15
  0.224,
16
  0.225
17
  ],
18
+ "mask_pad_size": {
19
+ "height": 256,
20
+ "width": 256
21
+ },
22
+ "mask_size": {
23
+ "longest_edge": 256
24
+ },
25
  "pad_size": {
26
  "height": 1024,
27
  "width": 1024
quantize_config.json CHANGED
@@ -2,81 +2,80 @@
2
  "per_channel": true,
3
  "reduce_range": true,
4
  "per_model_config": {
5
- "prompt_encoder_mask_decoder": {
6
  "op_types": [
7
- "Gather",
8
- "Sin",
9
- "Unsqueeze",
10
- "Not",
11
- "Cast",
12
- "Equal",
13
- "Neg",
14
- "MatMul",
15
- "Cos",
16
- "OneHot",
17
- "Transpose",
18
- "Sub",
19
- "Where",
20
  "Erf",
21
- "ConstantOfShape",
22
- "ReduceMean",
23
- "Shape",
24
- "Range",
25
- "Expand",
26
- "Div",
27
- "Relu",
28
- "ConvTranspose",
29
  "Tile",
30
  "Concat",
31
- "ScatterND",
 
 
 
 
32
  "Sqrt",
33
- "Slice",
34
- "Mul",
 
 
 
 
 
35
  "Constant",
36
- "Pow",
37
- "Reshape",
 
 
 
38
  "Add",
39
- "Softmax"
 
 
 
 
40
  ],
41
- "weight_type": "QInt8"
42
  },
43
- "vision_encoder": {
44
  "op_types": [
45
- "Gather",
46
- "Sin",
 
 
47
  "Unsqueeze",
 
 
 
 
 
 
 
 
 
48
  "Cast",
49
- "MatMul",
50
  "Cos",
51
- "Transpose",
52
- "Sub",
53
- "Pad",
54
- "Erf",
55
- "Conv",
56
- "ConstantOfShape",
57
- "Resize",
58
  "ReduceMean",
 
 
 
 
59
  "Shape",
 
60
  "Range",
61
- "Expand",
62
- "Div",
63
- "Tile",
64
- "Mod",
65
- "Squeeze",
66
- "Concat",
67
- "Sqrt",
68
- "Split",
69
- "Mul",
70
- "Slice",
71
- "Identity",
72
- "Constant",
73
  "Pow",
74
- "Einsum",
75
- "Reshape",
76
- "Add",
77
- "Softmax"
78
  ],
79
- "weight_type": "QUInt8"
80
  }
81
  }
82
  }
 
2
  "per_channel": true,
3
  "reduce_range": true,
4
  "per_model_config": {
5
+ "vision_encoder": {
6
  "op_types": [
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  "Erf",
8
+ "Squeeze",
9
+ "Pad",
10
+ "Mul",
11
+ "Split",
12
+ "Unsqueeze",
 
 
 
13
  "Tile",
14
  "Concat",
15
+ "Einsum",
16
+ "Reshape",
17
+ "Expand",
18
+ "Transpose",
19
+ "Sub",
20
  "Sqrt",
21
+ "Identity",
22
+ "Cast",
23
+ "Softmax",
24
+ "Cos",
25
+ "Mod",
26
+ "Div",
27
+ "ReduceMean",
28
  "Constant",
29
+ "Slice",
30
+ "ConstantOfShape",
31
+ "Range",
32
+ "Resize",
33
+ "Conv",
34
  "Add",
35
+ "MatMul",
36
+ "Shape",
37
+ "Gather",
38
+ "Pow",
39
+ "Sin"
40
  ],
41
+ "weight_type": "QUInt8"
42
  },
43
+ "prompt_encoder_mask_decoder": {
44
  "op_types": [
45
+ "Erf",
46
+ "Relu",
47
+ "Mul",
48
+ "Where",
49
  "Unsqueeze",
50
+ "Tile",
51
+ "ScatterND",
52
+ "Concat",
53
+ "Reshape",
54
+ "ConvTranspose",
55
+ "Expand",
56
+ "Sub",
57
+ "Transpose",
58
+ "Sqrt",
59
  "Cast",
60
+ "Softmax",
61
  "Cos",
62
+ "Div",
63
+ "Constant",
 
 
 
 
 
64
  "ReduceMean",
65
+ "Slice",
66
+ "ConstantOfShape",
67
+ "Not",
68
+ "Add",
69
  "Shape",
70
+ "Gather",
71
  "Range",
72
+ "MatMul",
73
+ "OneHot",
 
 
 
 
 
 
 
 
 
 
74
  "Pow",
75
+ "Equal",
76
+ "Sin"
 
 
77
  ],
78
+ "weight_type": "QInt8"
79
  }
80
  }
81
  }