Xenova HF staff committed on
Commit
520220e
1 Parent(s): 7a51d9c

Upload folder using huggingface_hub

Browse files
onnx/text_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86051a90491b97e2ea1d0351ef664926735bca7536034384f901915ee91fd69
3
+ size 494947485
onnx/text_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d31c7a212681c3918d78193b6b4f98c70fe540577f9a0a57fe7ba8c7439244c
3
+ size 124987663
onnx/vision_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff49f8aa57c7abfd26e382eb083e4dbf988505223a9bd3767dbfd4e729206709
3
+ size 1216438437
onnx/vision_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a658de8944a2001719beabf6c5030cfe7b3dc80e85983f69fc648d6b4d7ec0f
3
+ size 307001500
quantize_config.json CHANGED
@@ -2,42 +2,67 @@
2
  "per_channel": true,
3
  "reduce_range": true,
4
  "per_model_config": {
5
- "model": {
6
  "op_types": [
7
- "ArgMax",
8
- "Less",
9
- "Div",
10
  "Concat",
11
- "Where",
12
- "Expand",
13
- "ReduceSum",
14
- "Mul",
15
- "Cast",
16
- "MatMul",
17
  "Slice",
18
- "Squeeze",
19
- "Exp",
20
- "ReduceMean",
21
  "Gather",
 
 
 
 
 
22
  "Sqrt",
 
 
 
23
  "Conv",
24
- "Unsqueeze",
 
 
 
25
  "Pow",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  "Add",
 
 
 
 
 
 
 
 
27
  "Reshape",
 
 
28
  "Sub",
29
- "Softmax",
30
- "Range",
31
- "Constant",
32
  "ConstantOfShape",
33
- "Shape",
34
- "Abs",
35
- "Transpose",
36
  "Equal",
37
- "Sigmoid",
38
- "Flatten"
 
 
39
  ],
40
- "weight_type": "QUInt8"
41
  }
42
  }
43
  }
 
2
  "per_channel": true,
3
  "reduce_range": true,
4
  "per_model_config": {
5
+ "vision_model": {
6
  "op_types": [
7
+ "Constant",
8
+ "Shape",
 
9
  "Concat",
 
 
 
 
 
 
10
  "Slice",
11
+ "Mul",
12
+ "Div",
13
+ "Add",
14
  "Gather",
15
+ "Transpose",
16
+ "MatMul",
17
+ "Expand",
18
+ "Sigmoid",
19
+ "Unsqueeze",
20
  "Sqrt",
21
+ "Reshape",
22
+ "ReduceMean",
23
+ "Where",
24
  "Conv",
25
+ "Sub",
26
+ "ConstantOfShape",
27
+ "Cast",
28
+ "Equal",
29
  "Pow",
30
+ "Softmax"
31
+ ],
32
+ "weight_type": "QUInt8"
33
+ },
34
+ "text_model": {
35
+ "op_types": [
36
+ "Constant",
37
+ "Range",
38
+ "Shape",
39
+ "Flatten",
40
+ "Concat",
41
+ "Slice",
42
+ "Mul",
43
+ "Div",
44
  "Add",
45
+ "Gather",
46
+ "ArgMax",
47
+ "Transpose",
48
+ "MatMul",
49
+ "Expand",
50
+ "Sigmoid",
51
+ "Unsqueeze",
52
+ "Sqrt",
53
  "Reshape",
54
+ "ReduceMean",
55
+ "Where",
56
  "Sub",
 
 
 
57
  "ConstantOfShape",
58
+ "Cast",
 
 
59
  "Equal",
60
+ "Pow",
61
+ "Less",
62
+ "Squeeze",
63
+ "Softmax"
64
  ],
65
+ "weight_type": "QInt8"
66
  }
67
  }
68
  }