Xenova HF staff committed on
Commit
e543552
1 Parent(s): dcd52d5

Upload folder using huggingface_hub

Browse files
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:697a94ad777226e8b7eb83ab3ffa6c23614e156063f96fc530a61b9ad1d42909
3
  size 819827967
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c15a6f30dad41c3265f6786dbd850b6c563d9e6cca0197a1517822ccf2cb44b
3
  size 819827967
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f13b225f3ac82972f03a43ab7419c489612acf9b66c47a97d0cd8390641c721
3
- size 206174232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06a8b2aad1811a49576bb1fae43142bd91fc90204065a363191268ee84a7cd28
3
+ size 206825235
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:607ea7b1b4cdea8c574f4778fddf8399bb953c2f4dd52afb88188d0757a0a98c
3
- size 205786985
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b704da825ee605a2576a88093fed2442978b00309d3a576337ae2fe1ac843fcf
3
+ size 206437988
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d68b0a160502ea0e6d5af0144fbaed6ebb78cdb1bbae4beeb4e37e4131e8810
3
- size 193085165
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8615325c7835f7734c6c6ed53264dc85f9954db1f176697cf033fc596fc7f52c
3
+ size 193674668
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffb6c0547b82b923abff346f03b2f0d75489bd71bdacc2fb773a9dc5d94b7d68
3
- size 128543065
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d9b2d8fb1b6ebf7133046eaba3ea0dc0539be0523caa14c3e9b22131518a02
3
+ size 128819737
quantize_config.json CHANGED
@@ -1,123 +1,123 @@
1
  {
2
- "per_channel": false,
3
- "reduce_range": false,
4
  "per_model_config": {
5
  "decoder_model": {
6
  "op_types": [
7
  "Cast",
8
- "Reshape",
9
- "Gather",
10
- "Sub",
11
  "Slice",
12
- "Erf",
13
- "Less",
14
- "Mul",
15
- "Div",
16
  "Pow",
 
17
  "MatMul",
18
- "Add",
 
19
  "Equal",
 
 
 
20
  "Softmax",
21
- "Transpose",
22
- "Sqrt",
23
  "ConstantOfShape",
24
- "Concat",
25
- "Unsqueeze",
26
- "Expand",
27
- "Constant",
28
- "ReduceMean",
29
  "Range",
30
- "Squeeze",
31
- "Where",
32
- "Shape"
 
 
 
33
  ],
34
  "weight_type": "QInt8"
35
  },
36
  "decoder_model_merged": {
37
  "op_types": [
38
  "Cast",
39
- "Reshape",
40
- "Gather",
41
- "Sub",
42
- "Slice",
43
- "Erf",
44
- "Less",
45
- "Mul",
46
- "Div",
47
- "Pow",
48
- "MatMul",
49
- "Add",
50
  "If",
51
- "Equal",
52
- "Softmax",
53
  "Transpose",
54
- "Sqrt",
55
- "ConstantOfShape",
56
  "Concat",
57
  "Unsqueeze",
 
 
58
  "Expand",
 
 
 
 
 
 
59
  "Constant",
60
- "ReduceMean",
61
- "Range",
62
  "Squeeze",
63
- "Where",
64
- "Shape"
 
 
 
 
 
 
65
  ],
66
  "weight_type": "QInt8"
67
  },
68
  "decoder_with_past_model": {
69
  "op_types": [
70
- "Reshape",
71
  "Cast",
72
- "Gather",
73
- "Sub",
74
- "Erf",
75
- "Mul",
76
- "Div",
77
- "Pow",
78
- "MatMul",
79
- "Add",
80
- "Equal",
81
- "Softmax",
82
  "Transpose",
83
- "Sqrt",
84
- "ConstantOfShape",
85
  "Concat",
86
  "Unsqueeze",
 
 
87
  "Expand",
 
 
 
 
 
 
88
  "Constant",
89
- "ReduceMean",
 
 
90
  "Range",
91
- "Where",
92
- "Shape"
 
 
 
93
  ],
94
  "weight_type": "QInt8"
95
  },
96
  "encoder_model": {
97
  "op_types": [
98
- "Reshape",
99
  "Cast",
100
- "Gather",
101
- "Sub",
102
- "Erf",
103
- "Mul",
104
- "Div",
105
- "Pow",
106
- "MatMul",
107
- "Add",
108
- "Equal",
109
- "Softmax",
110
  "Transpose",
111
- "Sqrt",
112
- "ConstantOfShape",
113
  "Concat",
114
  "Unsqueeze",
 
 
115
  "Expand",
 
 
 
 
 
 
116
  "Constant",
117
- "ReduceMean",
 
 
118
  "Range",
119
- "Where",
120
- "Shape"
 
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
1
  {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
  "per_model_config": {
5
  "decoder_model": {
6
  "op_types": [
7
  "Cast",
8
+ "Transpose",
 
 
9
  "Slice",
10
+ "Concat",
11
+ "Unsqueeze",
12
+ "Where",
 
13
  "Pow",
14
+ "Expand",
15
  "MatMul",
16
+ "Sub",
17
+ "Div",
18
  "Equal",
19
+ "Mul",
20
+ "Gather",
21
+ "Constant",
22
  "Softmax",
23
+ "Shape",
24
+ "Squeeze",
25
  "ConstantOfShape",
 
 
 
 
 
26
  "Range",
27
+ "Less",
28
+ "Add",
29
+ "Sqrt",
30
+ "Reshape",
31
+ "ReduceMean",
32
+ "Erf"
33
  ],
34
  "weight_type": "QInt8"
35
  },
36
  "decoder_model_merged": {
37
  "op_types": [
38
  "Cast",
 
 
 
 
 
 
 
 
 
 
 
39
  "If",
 
 
40
  "Transpose",
41
+ "Slice",
 
42
  "Concat",
43
  "Unsqueeze",
44
+ "Where",
45
+ "Pow",
46
  "Expand",
47
+ "MatMul",
48
+ "Sub",
49
+ "Div",
50
+ "Equal",
51
+ "Mul",
52
+ "Gather",
53
  "Constant",
54
+ "Softmax",
55
+ "Shape",
56
  "Squeeze",
57
+ "ConstantOfShape",
58
+ "Range",
59
+ "Less",
60
+ "Add",
61
+ "Sqrt",
62
+ "Reshape",
63
+ "ReduceMean",
64
+ "Erf"
65
  ],
66
  "weight_type": "QInt8"
67
  },
68
  "decoder_with_past_model": {
69
  "op_types": [
 
70
  "Cast",
 
 
 
 
 
 
 
 
 
 
71
  "Transpose",
 
 
72
  "Concat",
73
  "Unsqueeze",
74
+ "Where",
75
+ "Pow",
76
  "Expand",
77
+ "MatMul",
78
+ "Sub",
79
+ "Div",
80
+ "Equal",
81
+ "Mul",
82
+ "Gather",
83
  "Constant",
84
+ "Softmax",
85
+ "Shape",
86
+ "ConstantOfShape",
87
  "Range",
88
+ "Add",
89
+ "Sqrt",
90
+ "Reshape",
91
+ "ReduceMean",
92
+ "Erf"
93
  ],
94
  "weight_type": "QInt8"
95
  },
96
  "encoder_model": {
97
  "op_types": [
 
98
  "Cast",
 
 
 
 
 
 
 
 
 
 
99
  "Transpose",
 
 
100
  "Concat",
101
  "Unsqueeze",
102
+ "Where",
103
+ "Pow",
104
  "Expand",
105
+ "MatMul",
106
+ "Sub",
107
+ "Div",
108
+ "Equal",
109
+ "Mul",
110
+ "Gather",
111
  "Constant",
112
+ "Softmax",
113
+ "Shape",
114
+ "ConstantOfShape",
115
  "Range",
116
+ "Add",
117
+ "Sqrt",
118
+ "Reshape",
119
+ "ReduceMean",
120
+ "Erf"
121
  ],
122
  "weight_type": "QInt8"
123
  }