File size: 3,112 Bytes
690919f
 
 
 
418a5c8
690919f
61f54c3
9b9dca5
418a5c8
61f54c3
418a5c8
 
 
 
 
 
61f54c3
418a5c8
 
 
 
 
 
9b9dca5
61f54c3
418a5c8
 
 
 
9b9dca5
418a5c8
9b9dca5
 
 
61f54c3
9b9dca5
61f54c3
418a5c8
 
 
 
 
61f54c3
418a5c8
 
 
 
 
 
690919f
418a5c8
 
 
 
 
61f54c3
418a5c8
 
 
690919f
 
 
418a5c8
690919f
61f54c3
 
 
418a5c8
 
 
 
 
61f54c3
418a5c8
 
 
 
 
 
 
 
 
 
 
61f54c3
 
418a5c8
 
 
9b9dca5
418a5c8
9b9dca5
 
 
61f54c3
9b9dca5
61f54c3
418a5c8
 
 
 
 
 
61f54c3
418a5c8
 
 
 
 
9b9dca5
418a5c8
 
 
 
 
 
61f54c3
418a5c8
 
 
690919f
9b9dca5
690919f
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
{
    "per_channel": false,
    "reduce_range": false,
    "per_model_config": {
        "encoder_model": {
            "op_types": [
                "MatMul",
                "Add",
                "Equal",
                "ConstantOfShape",
                "Pow",
                "Erf",
                "Sub",
                "Mul",
                "Reshape",
                "Div",
                "Where",
                "Unsqueeze",
                "Expand",
                "Gather",
                "Softmax",
                "Transpose",
                "Constant",
                "Shape",
                "ReduceMean",
                "Concat",
                "Sqrt",
                "Slice",
                "Conv"
            ],
            "weight_type": "QUInt8"
        },
        "decoder_model": {
            "op_types": [
                "MatMul",
                "Add",
                "ConstantOfShape",
                "Pow",
                "Sub",
                "Mul",
                "Reshape",
                "Div",
                "Where",
                "Tanh",
                "Unsqueeze",
                "Gather",
                "Softmax",
                "Split",
                "Slice",
                "Squeeze",
                "Range",
                "Transpose",
                "Cast",
                "Constant",
                "Shape",
                "ReduceMean",
                "Concat",
                "Sqrt",
                "Gemm"
            ],
            "weight_type": "QInt8"
        },
        "decoder_with_past_model": {
            "op_types": [
                "MatMul",
                "Add",
                "ConstantOfShape",
                "Pow",
                "Sub",
                "Mul",
                "Reshape",
                "Div",
                "Where",
                "Tanh",
                "Unsqueeze",
                "Gather",
                "Softmax",
                "Split",
                "Slice",
                "Squeeze",
                "Range",
                "Transpose",
                "Cast",
                "Constant",
                "Shape",
                "ReduceMean",
                "Concat",
                "Sqrt",
                "Gemm"
            ],
            "weight_type": "QInt8"
        },
        "decoder_model_merged": {
            "op_types": [
                "MatMul",
                "Add",
                "ConstantOfShape",
                "Pow",
                "Sub",
                "Mul",
                "Gemm",
                "Reshape",
                "Div",
                "Where",
                "Tanh",
                "Unsqueeze",
                "Gather",
                "Softmax",
                "Split",
                "Squeeze",
                "Range",
                "Transpose",
                "Cast",
                "Constant",
                "If",
                "Shape",
                "ReduceMean",
                "Concat",
                "Sqrt",
                "Slice"
            ],
            "weight_type": "QInt8"
        }
    }
}