huuquyet committed on
Commit
63668ed
1 Parent(s): 8835def

feat: Update converted model

Browse files
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f98bb48af59b4056fc2ead555a622ccabb6e3ccce08cfdf6b5f14d7ddfe8340d
3
  size 118384989
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cd895ce0365bd5584ccfaeef6e3f4bc073f5e016daedab0a552f0915f8258ba
3
  size 118384989
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:306f3f9a0e73d7969d4c7a30c4d4b1cfb7f7ee42da25957f9f4436bf4f5d4d37
3
  size 118533120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c169b8c330d4345cdf607e23dbff2664bad8c767c7ead33343248a3df773bf5
3
  size 118533120
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:186ab8c54100916d8a80c1f0f5841079e32d8e9dcf361365b3a78a92cf172664
3
  size 30667401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a36371f1eac6675aec784a6cdb35f29154d3cf95bd8969f434c40269f11112d
3
  size 30667401
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae0df86d12374c58a759fc6144934d897e6aaada7714a1ba8975563e0ce050d4
3
  size 113630778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10b42204abf25cb1cdc5b157e3ebf10c07fbf3d4a7c1bcace0930643442b7227
3
  size 113630778
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65844ff13890acf9fa4e01bdd6e01c3ad77f89664ee4098337fb28d19cea2fa6
3
  size 32900724
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21170c18ab8ef382e5a6188e99f348f93877e451e1e4e2732d5a5cf13a6db69d
3
  size 32900724
quantize_config.json CHANGED
@@ -4,110 +4,110 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Mul",
8
- "Pow",
9
- "Add",
10
- "Div",
11
- "Softmax",
12
- "Conv",
13
  "Erf",
14
- "Sub",
15
- "Transpose",
16
- "Reshape",
17
- "Gather",
18
- "ReduceMean",
19
- "Sqrt",
20
  "Constant",
 
 
21
  "MatMul",
22
  "Concat",
 
 
 
 
 
 
23
  "Unsqueeze",
24
- "Shape"
 
 
25
  ],
26
  "weight_type": "QUInt8"
27
  },
28
  "decoder_model": {
29
  "op_types": [
30
- "Pow",
 
31
  "Expand",
32
- "Transpose",
33
- "Less",
34
- "Softmax",
35
- "Range",
36
- "ConstantOfShape",
37
- "Mul",
38
- "Add",
39
  "Sub",
40
- "Where",
41
- "Gather",
42
- "Squeeze",
43
- "MatMul",
44
- "Erf",
45
- "Cast",
46
- "Reshape",
47
  "Concat",
 
48
  "Unsqueeze",
49
- "Div",
50
- "Slice",
51
  "Equal",
52
- "ReduceMean",
53
- "Sqrt",
54
  "Constant",
55
- "Shape"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
  ],
57
  "weight_type": "QInt8"
58
  },
59
  "decoder_with_past_model": {
60
  "op_types": [
61
- "Mul",
62
- "Pow",
63
  "Add",
64
- "Div",
65
- "Softmax",
66
  "Slice",
67
  "Sub",
68
- "Erf",
69
- "Transpose",
70
- "Reshape",
71
- "Gather",
72
  "ReduceMean",
 
73
  "Sqrt",
74
- "Concat",
75
- "Constant",
76
- "MatMul",
77
  "Unsqueeze",
78
- "Shape"
 
 
79
  ],
80
  "weight_type": "QInt8"
81
  },
82
  "decoder_model_merged": {
83
  "op_types": [
84
- "Pow",
 
85
  "Expand",
86
- "Transpose",
87
- "Less",
88
- "Softmax",
89
- "Range",
90
- "ConstantOfShape",
91
- "Mul",
92
- "Add",
93
  "Sub",
94
- "Where",
95
- "Gather",
96
- "Squeeze",
97
- "MatMul",
98
- "Erf",
99
- "Cast",
100
- "Reshape",
101
  "Concat",
102
- "Unsqueeze",
103
- "Div",
104
  "If",
105
- "Slice",
 
106
  "Equal",
107
- "ReduceMean",
108
- "Sqrt",
109
  "Constant",
110
- "Shape"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  ],
112
  "weight_type": "QInt8"
113
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
 
 
 
 
 
 
7
  "Erf",
8
+ "Add",
9
+ "Mul",
 
 
 
 
10
  "Constant",
11
+ "Sub",
12
+ "Div",
13
  "MatMul",
14
  "Concat",
15
+ "ReduceMean",
16
+ "Transpose",
17
+ "Sqrt",
18
+ "Pow",
19
+ "Conv",
20
+ "Gather",
21
  "Unsqueeze",
22
+ "Softmax",
23
+ "Shape",
24
+ "Reshape"
25
  ],
26
  "weight_type": "QUInt8"
27
  },
28
  "decoder_model": {
29
  "op_types": [
30
+ "Erf",
31
+ "Squeeze",
32
  "Expand",
 
 
 
 
 
 
 
33
  "Sub",
 
 
 
 
 
 
 
34
  "Concat",
35
+ "Sqrt",
36
  "Unsqueeze",
37
+ "Range",
 
38
  "Equal",
 
 
39
  "Constant",
40
+ "ConstantOfShape",
41
+ "ReduceMean",
42
+ "Transpose",
43
+ "Gather",
44
+ "Less",
45
+ "Shape",
46
+ "Add",
47
+ "Slice",
48
+ "Div",
49
+ "Where",
50
+ "Reshape",
51
+ "Cast",
52
+ "Mul",
53
+ "MatMul",
54
+ "Pow",
55
+ "Softmax"
56
  ],
57
  "weight_type": "QInt8"
58
  },
59
  "decoder_with_past_model": {
60
  "op_types": [
61
+ "Erf",
 
62
  "Add",
63
+ "Mul",
64
+ "Constant",
65
  "Slice",
66
  "Sub",
67
+ "Div",
68
+ "MatMul",
69
+ "Concat",
 
70
  "ReduceMean",
71
+ "Transpose",
72
  "Sqrt",
73
+ "Pow",
74
+ "Gather",
 
75
  "Unsqueeze",
76
+ "Softmax",
77
+ "Shape",
78
+ "Reshape"
79
  ],
80
  "weight_type": "QInt8"
81
  },
82
  "decoder_model_merged": {
83
  "op_types": [
84
+ "Erf",
85
+ "Squeeze",
86
  "Expand",
 
 
 
 
 
 
 
87
  "Sub",
 
 
 
 
 
 
 
88
  "Concat",
89
+ "Sqrt",
 
90
  "If",
91
+ "Unsqueeze",
92
+ "Range",
93
  "Equal",
 
 
94
  "Constant",
95
+ "ConstantOfShape",
96
+ "ReduceMean",
97
+ "Transpose",
98
+ "Gather",
99
+ "Less",
100
+ "Shape",
101
+ "Add",
102
+ "Slice",
103
+ "Div",
104
+ "Where",
105
+ "Reshape",
106
+ "Cast",
107
+ "Mul",
108
+ "MatMul",
109
+ "Pow",
110
+ "Softmax"
111
  ],
112
  "weight_type": "QInt8"
113
  }