Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +104 -0

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e918f5de08de4cb6fcae6db006f9618bf55015a517903bae5b9576ac71a2fd6b
 size 1399393

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b5440b416feb4f24695692b176225f518deafed3c017cea8ba6d5fe0151cf81
 size 1399393

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46bbf11c9e9fb14f36e2e9428b3eead8e90342f6554369d8aa1ff34606635e03
-size 821504874

 version https://git-lfs.github.com/spec/v1
+oid sha256:a93ddbe77bb8359c687418bf7592b46f5bd3e5ea2fe8dbf62ea682c73b8cc3ea
+size 819144015

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a83014d55c5fa9fc9264040513b9b7bd5eff1d9d4da78d66acfae8410c222efa
-size 820477030

 version https://git-lfs.github.com/spec/v1
+oid sha256:e3f054fdc6afd82cbbf5f23b6f32770fff798d7620e2457c838fb5b5a0facec3
+size 818116171

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f981dcad0360bd9da6f48d95f457fd0a9590c29d4ef9fb9114b95e42f125328f
-size 820479158

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ffe8bf5750be07cc010c1d018e16e45d13fe8f2ecdde7ae904693fe6a31055a
+size 818118299

quantize_config.json ADDED Viewed

	@@ -0,0 +1,104 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "ScatterND",
+                "ReduceMean",
+                "Transpose",
+                "Expand",
+                "CumSum",
+                "Softmax",
+                "Gather",
+                "Reshape",
+                "Tanh",
+                "Unsqueeze",
+                "Cast",
+                "Pow",
+                "Equal",
+                "Concat",
+                "Constant",
+                "Slice",
+                "Sub",
+                "Range",
+                "Sqrt",
+                "Not",
+                "Mul",
+                "Div",
+                "Less",
+                "Or",
+                "MatMul",
+                "Shape",
+                "Add",
+                "Where",
+                "ConstantOfShape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "ScatterND",
+                "ReduceMean",
+                "Transpose",
+                "Expand",
+                "CumSum",
+                "Softmax",
+                "Gather",
+                "Reshape",
+                "Tanh",
+                "Unsqueeze",
+                "Cast",
+                "Pow",
+                "Equal",
+                "Concat",
+                "Constant",
+                "Slice",
+                "Sub",
+                "Range",
+                "Sqrt",
+                "Not",
+                "Mul",
+                "If",
+                "Div",
+                "Less",
+                "Or",
+                "MatMul",
+                "Shape",
+                "Add",
+                "Where",
+                "ConstantOfShape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "ReduceMean",
+                "Transpose",
+                "Expand",
+                "CumSum",
+                "Softmax",
+                "Gather",
+                "Reshape",
+                "Tanh",
+                "Unsqueeze",
+                "Cast",
+                "Pow",
+                "Equal",
+                "Concat",
+                "Constant",
+                "Sub",
+                "Sqrt",
+                "Not",
+                "Mul",
+                "Div",
+                "MatMul",
+                "Shape",
+                "Add",
+                "Where",
+                "ConstantOfShape"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}