Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +66 -66

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b0f375b96dd3a76b25f4d5377eda6376faae560682bed258510f0bbd8289470
 size 791453859

 version https://git-lfs.github.com/spec/v1
+oid sha256:55fbbfbdd774d0f4cc2a92f59f11e58584539d3a92dfb6536f65d4d3c1c4f57a
 size 791453859

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:be7061281a908c61b62bd0bc9dea7a707a72d55a374deab3ccfaec173acc2aa2
-size 299954775

 version https://git-lfs.github.com/spec/v1
+oid sha256:4699d4bb1950bb65f77e2f6ce1b26a51f26fdb5813e22581efcf0c40fd8b95b4
+size 300505575

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6889a8fdc9daf18b7aa3c6124684eaffd0fb2fba6ee0103064ad719d79d7bf0a
-size 232306103

 version https://git-lfs.github.com/spec/v1
+oid sha256:3a960ff52fcdff888c99beb87c7a497165a3e2201b3c24777ce295b37c546062
+size 232856903

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66061e6a38529a523db921f29bebea1086e4753e60daff773ecfe8fb48ad0b10
-size 232315060

 version https://git-lfs.github.com/spec/v1
+oid sha256:c964f2c88afb32affe47ab3d531c48617ebe071b393ad5eec09c1e410948b4bf
+size 232865860

quantize_config.json CHANGED Viewed

@@ -1,98 +1,98 @@
 {
-    "per_channel": false,
-    "reduce_range": false,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
                 "Add",
-                "Shape",
-                "Where",
-                "Sub",
-                "Unsqueeze",
-                "Equal",
-                "Concat",
-                "Reshape",
-                "Softmax",
                 "Constant",
-                "Tanh",
-                "Gather",
-                "CumSum",
-                "Squeeze",
-                "Sqrt",
-                "Cast",
-                "Slice",
                 "Split",
-                "Transpose",
                 "ConstantOfShape",
-                "Mul",
-                "Div",
                 "MatMul",
-                "And",
-                "Pow",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
                 "Add",
-                "Shape",
-                "Where",
-                "Sub",
-                "Unsqueeze",
-                "Equal",
-                "Concat",
-                "Reshape",
-                "Softmax",
                 "Constant",
-                "Tanh",
-                "Gather",
-                "CumSum",
-                "Squeeze",
-                "Sqrt",
-                "Cast",
-                "Slice",
                 "Split",
-                "Transpose",
                 "ConstantOfShape",
-                "If",
-                "Mul",
-                "Div",
                 "MatMul",
-                "And",
-                "Pow",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
                 "Add",
-                "Shape",
-                "Where",
-                "Sub",
-                "Unsqueeze",
-                "Equal",
-                "Concat",
-                "Reshape",
-                "Softmax",
                 "Constant",
-                "Tanh",
-                "Gather",
-                "Squeeze",
-                "CumSum",
-                "Sqrt",
-                "Slice",
-                "Cast",
                 "Split",
-                "Transpose",
                 "ConstantOfShape",
-                "Mul",
-                "Div",
                 "MatMul",
-                "And",
-                "Pow",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": true,
+    "reduce_range": true,
     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Transpose",
+                "ReduceMean",
+                "Div",
+                "Gather",
+                "And",
                 "Add",
                 "Constant",
+                "Mul",
+                "Concat",
+                "Sub",
                 "Split",
+                "Pow",
+                "Tanh",
                 "ConstantOfShape",
+                "Softmax",
+                "Cast",
+                "Sqrt",
+                "Equal",
+                "Squeeze",
+                "Shape",
                 "MatMul",
+                "Where",
+                "Reshape",
+                "Unsqueeze",
+                "Slice",
+                "CumSum"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Transpose",
+                "ReduceMean",
+                "Div",
+                "Gather",
+                "And",
                 "Add",
                 "Constant",
+                "Mul",
+                "Concat",
+                "If",
+                "Sub",
                 "Split",
+                "Pow",
+                "Tanh",
                 "ConstantOfShape",
+                "Softmax",
+                "Cast",
+                "Sqrt",
+                "Equal",
+                "Squeeze",
+                "Shape",
                 "MatMul",
+                "Where",
+                "Reshape",
+                "Unsqueeze",
+                "Slice",
+                "CumSum"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Transpose",
+                "ReduceMean",
+                "Div",
+                "Gather",
+                "And",
                 "Add",
                 "Constant",
+                "Mul",
+                "Concat",
+                "Sub",
                 "Split",
+                "Pow",
+                "Tanh",
                 "ConstantOfShape",
+                "Softmax",
+                "Cast",
+                "Sqrt",
+                "Equal",
+                "Squeeze",
+                "Shape",
                 "MatMul",
+                "Where",
+                "Reshape",
+                "Unsqueeze",
+                "Slice",
+                "CumSum"
             ],
             "weight_type": "QInt8"
         }