Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +74 -74

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a34147806885ea37601ae6d91a2598a93acc78db07a06e637f2f1e6ef9c90699
-size 819581461

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b2ceb285d8c3b54dc13baad904077f9fc0b3d926ff193e4345c9bca9c2f8dc0
+size 613700175

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2c15a6f30dad41c3265f6786dbd850b6c563d9e6cca0197a1517822ccf2cb44b
-size 819827967

 version https://git-lfs.github.com/spec/v1
+oid sha256:32a8b5910c88ced64a7f8507dcc1fa785fa612fc27797105a2b7daf1843b8b0b
+size 613946766

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06a8b2aad1811a49576bb1fae43142bd91fc90204065a363191268ee84a7cd28
-size 206825235

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a584dce621f77e39008055b6ef4ae9d3698241758e568edf3e5b0ad5fd6ccb2
+size 155102167

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b704da825ee605a2576a88093fed2442978b00309d3a576337ae2fe1ac843fcf
-size 206437988

 version https://git-lfs.github.com/spec/v1
+oid sha256:034156c203b082ef11ac78e46cfffc96dd2f83f2c6c5a1d16401eef97291ae5e
+size 154715574

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:145e78c5a35e7bd92f57f58b17b9538c202ccd2e4b233b8f4deb2d91e3454a32
-size 769158110

 version https://git-lfs.github.com/spec/v1
+oid sha256:009480ed2abb7b8a20f127de89cf202b60f719ccf642813c332a5672f4d1506d
+size 563276824

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8615325c7835f7734c6c6ed53264dc85f9954db1f176697cf033fc596fc7f52c
-size 193674668

 version https://git-lfs.github.com/spec/v1
+oid sha256:58a6832ec3a2e328322bae85925ad82b71622f0a535ccca65fa88bf082ee7c41
+size 141952254

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Cast",
-                "Transpose",
-                "Slice",
-                "Concat",
                 "Unsqueeze",
                 "Where",
-                "Pow",
-                "Expand",
-                "MatMul",
-                "Sub",
                 "Div",
-                "Equal",
-                "Mul",
-                "Gather",
                 "Constant",
-                "Softmax",
                 "Shape",
-                "Squeeze",
-                "ConstantOfShape",
-                "Range",
-                "Less",
-                "Add",
                 "Sqrt",
                 "Reshape",
-                "ReduceMean",
-                "Erf"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Cast",
-                "If",
-                "Transpose",
-                "Slice",
-                "Concat",
                 "Unsqueeze",
                 "Where",
-                "Pow",
-                "Expand",
-                "MatMul",
-                "Sub",
                 "Div",
-                "Equal",
-                "Mul",
-                "Gather",
                 "Constant",
-                "Softmax",
                 "Shape",
-                "Squeeze",
-                "ConstantOfShape",
-                "Range",
-                "Less",
-                "Add",
                 "Sqrt",
                 "Reshape",
-                "ReduceMean",
-                "Erf"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Cast",
-                "Transpose",
-                "Concat",
                 "Unsqueeze",
                 "Where",
-                "Pow",
-                "Expand",
-                "MatMul",
-                "Sub",
                 "Div",
-                "Equal",
-                "Mul",
-                "Gather",
                 "Constant",
-                "Softmax",
                 "Shape",
-                "ConstantOfShape",
-                "Range",
-                "Add",
                 "Sqrt",
                 "Reshape",
-                "ReduceMean",
-                "Erf"
             ],
             "weight_type": "QInt8"
         },
-        "encoder_model": {
             "op_types": [
-                "Cast",
-                "Transpose",
-                "Concat",
                 "Unsqueeze",
                 "Where",
-                "Pow",
-                "Expand",
-                "MatMul",
-                "Sub",
                 "Div",
-                "Equal",
-                "Mul",
-                "Gather",
                 "Constant",
-                "Softmax",
                 "Shape",
-                "ConstantOfShape",
-                "Range",
-                "Add",
                 "Sqrt",
                 "Reshape",
-                "ReduceMean",
-                "Erf"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Range",
+                "Less",
+                "Pow",
                 "Unsqueeze",
+                "ConstantOfShape",
+                "Squeeze",
                 "Where",
                 "Div",
+                "ReduceMean",
                 "Constant",
+                "Cast",
+                "Slice",
+                "Erf",
+                "MatMul",
                 "Shape",
+                "Softmax",
                 "Sqrt",
+                "Sub",
                 "Reshape",
+                "Transpose",
+                "Expand",
+                "Mul",
+                "Gather",
+                "Equal",
+                "Concat",
+                "Add"
             ],
             "weight_type": "QInt8"
         },
+        "encoder_model": {
             "op_types": [
+                "Range",
+                "Pow",
                 "Unsqueeze",
+                "ConstantOfShape",
                 "Where",
                 "Div",
+                "ReduceMean",
                 "Constant",
+                "Cast",
+                "Erf",
+                "MatMul",
                 "Shape",
+                "Softmax",
                 "Sqrt",
+                "Sub",
                 "Reshape",
+                "Transpose",
+                "Expand",
+                "Gather",
+                "Mul",
+                "Equal",
+                "Concat",
+                "Add"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Range",
+                "Less",
+                "Pow",
                 "Unsqueeze",
+                "ConstantOfShape",
+                "Squeeze",
                 "Where",
                 "Div",
+                "ReduceMean",
                 "Constant",
+                "Cast",
+                "Slice",
+                "Erf",
+                "MatMul",
                 "Shape",
+                "Softmax",
                 "Sqrt",
+                "Sub",
                 "Reshape",
+                "Transpose",
+                "If",
+                "Expand",
+                "Mul",
+                "Gather",
+                "Equal",
+                "Concat",
+                "Add"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
+                "Range",
+                "Pow",
                 "Unsqueeze",
+                "ConstantOfShape",
                 "Where",
                 "Div",
+                "ReduceMean",
                 "Constant",
+                "Cast",
+                "Erf",
+                "MatMul",
                 "Shape",
+                "Softmax",
                 "Sqrt",
+                "Sub",
                 "Reshape",
+                "Transpose",
+                "Expand",
+                "Mul",
+                "Gather",
+                "Equal",
+                "Concat",
+                "Add"
             ],
             "weight_type": "QInt8"
         }