Xenova HF staff committed on
Commit
d45afc1
1 Parent(s): bfc15f2

Upload folder using huggingface_hub

Browse files
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73d198faf765aae8f5a5a74aa4450205002422d16a0241c38d2c17c62860fa7d
3
+ size 34343075
onnx/decoder_model_merged.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d7634cfd9726ef91a6777c9c40450cc5b728c16a709d68251b025f435c0b58c
3
+ size 7347314688
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cac9ed16a7533d67a6661aa99c06f3d1b0c1aed076f36dbb543fb3e826f9bb58
3
+ size 1872316846
quantize_config.json CHANGED
@@ -4,34 +4,34 @@
4
  "per_model_config": {
5
  "model": {
6
  "op_types": [
7
- "Gather",
8
- "Reshape",
9
- "Less",
10
  "Sqrt",
 
 
 
11
  "Shape",
 
 
12
  "Slice",
13
- "Sigmoid",
14
- "Where",
15
- "ConstantOfShape",
16
- "Unsqueeze",
17
- "Cast",
18
  "Add",
19
- "Sub",
20
- "ReduceMean",
21
  "Pow",
22
- "Div",
23
- "Concat",
24
- "Neg",
25
  "Trilu",
26
- "Equal",
27
- "Expand",
28
- "Transpose",
29
- "Softmax",
30
- "Squeeze",
31
  "Constant",
32
- "MatMul",
33
- "Range",
34
- "Mul"
 
 
 
 
 
 
 
35
  ],
36
  "weight_type": "QInt8"
37
  }
 
4
  "per_model_config": {
5
  "model": {
6
  "op_types": [
7
+ "Sub",
8
+ "Sigmoid",
 
9
  "Sqrt",
10
+ "Equal",
11
+ "Less",
12
+ "Softmax",
13
  "Shape",
14
+ "MatMul",
15
+ "ReduceMean",
16
  "Slice",
17
+ "Transpose",
18
+ "Neg",
19
+ "Range",
 
 
20
  "Add",
21
+ "Mul",
 
22
  "Pow",
 
 
 
23
  "Trilu",
 
 
 
 
 
24
  "Constant",
25
+ "Gather",
26
+ "Concat",
27
+ "Squeeze",
28
+ "Div",
29
+ "Reshape",
30
+ "Expand",
31
+ "Cast",
32
+ "ConstantOfShape",
33
+ "Unsqueeze",
34
+ "Where"
35
  ],
36
  "weight_type": "QInt8"
37
  }