Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +63 -63

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d094736e8b3b6e67e9c3b8a30259a053f06e7bd75d5efd4ea406b6dc441f8690
-size 314523257

 version https://git-lfs.github.com/spec/v1
+oid sha256:08ca2300844d32d52d5743bf6ec9a2c0953a11f90a031f82b98c4c373813a529
+size 208304195

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb8ca7ec5a9bcdc49011bc15946cf334a9cf908a5b0fff6d3165a0b178670913
-size 314779197

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5df8d95539f2f87ec81663f676aab11772b766bced6b4ba21735255a6f317c4
+size 208560983

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a6134ef1ab4b1d7fa2f0aadfd15478537db3fe86793c251abf65630591767f6
-size 80262105

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e2bd3a0083d3e31e9c3e29d089d1d44eb365a782781389f82fd5ed133f7589a
+size 53707540

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff30d094886804d49108f957ac895bef102352e310c960a58e0f8856f3dd5670
-size 79864827

 version https://git-lfs.github.com/spec/v1
+oid sha256:d83958fa9b5279484cdc3b5923c903450663683d60980f29fdb1fe4b64cbdd9d
+size 53309878

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4adecec0758b3919d07f8d1127d3c34eb01e3f1ece2e874f60a3227ddd238dca
-size 301889972

 version https://git-lfs.github.com/spec/v1
+oid sha256:b90cf3b333790a022840a80a38947d5b3b262c9df9a0424af4aac2e617c984b3
+size 195670910

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d1b67629c24bba0294ec5f054933dc4ed17deb2861f6b8973ffca2ec98af5c46
-size 76643187

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e46514e9301c3721972b6ddc044d2c37749374dda74fd0c9dc27b75c29d8e64
+size 50088238

quantize_config.json CHANGED Viewed

@@ -2,112 +2,112 @@
     "per_channel": false,
     "reduce_range": false,
     "per_model_config": {
-        "decoder_model_merged": {
             "op_types": [
                 "Gather",
-                "Shape",
-                "Cast",
                 "Reshape",
                 "Sqrt",
-                "Constant",
-                "Unsqueeze",
-                "Squeeze",
                 "Pow",
                 "Concat",
-                "MatMul",
-                "Erf",
-                "Range",
                 "Softmax",
                 "Sub",
-                "Less",
                 "Div",
-                "ReduceMean",
-                "If",
-                "Slice",
-                "Where",
-                "Add",
-                "Mul",
-                "Expand",
-                "ConstantOfShape",
-                "Transpose",
-                "Equal"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
                 "Gather",
-                "Shape",
-                "Cast",
                 "Reshape",
                 "Sqrt",
-                "Constant",
-                "Unsqueeze",
-                "Squeeze",
                 "Pow",
                 "Concat",
-                "MatMul",
-                "Erf",
-                "Range",
                 "Softmax",
                 "Sub",
-                "Less",
                 "Div",
-                "ReduceMean",
-                "Slice",
-                "Where",
-                "Add",
-                "Mul",
-                "Expand",
-                "ConstantOfShape",
-                "Transpose",
-                "Equal"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Unsqueeze",
-                "Gather",
-                "Shape",
-                "Sub",
-                "Div",
-                "Reshape",
-                "Concat",
-                "ReduceMean",
-                "Pow",
-                "Mul",
                 "Slice",
                 "MatMul",
-                "Sqrt",
-                "Transpose",
                 "Add",
                 "Erf",
                 "Constant",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "encoder_model": {
             "op_types": [
-                "Sub",
                 "Gather",
-                "Shape",
-                "Unsqueeze",
                 "Div",
                 "ReduceMean",
                 "Pow",
-                "Mul",
                 "Concat",
                 "Reshape",
-                "MatMul",
-                "Transpose",
-                "Sqrt",
-                "Add",
-                "Erf",
-                "Softmax",
                 "Constant",
-                "Conv"
             ],
             "weight_type": "QUInt8"
         }

     "per_channel": false,
     "reduce_range": false,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
+                "Expand",
                 "Gather",
+                "Squeeze",
+                "Range",
+                "Equal",
+                "MatMul",
+                "ConstantOfShape",
+                "Add",
+                "Erf",
+                "ReduceMean",
                 "Reshape",
+                "Cast",
+                "Transpose",
                 "Sqrt",
+                "Less",
                 "Pow",
                 "Concat",
+                "Slice",
                 "Softmax",
+                "Where",
                 "Sub",
                 "Div",
+                "Unsqueeze",
+                "Shape",
+                "Constant",
+                "Mul"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Expand",
                 "Gather",
+                "Squeeze",
+                "Range",
+                "Equal",
+                "MatMul",
+                "ConstantOfShape",
+                "Add",
+                "Erf",
+                "ReduceMean",
                 "Reshape",
+                "Cast",
+                "Transpose",
                 "Sqrt",
+                "Less",
                 "Pow",
                 "Concat",
+                "Slice",
                 "Softmax",
+                "Where",
                 "Sub",
                 "Div",
+                "If",
+                "Unsqueeze",
+                "Shape",
+                "Constant",
+                "Mul"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Sqrt",
                 "Slice",
                 "MatMul",
+                "Softmax",
+                "Gather",
                 "Add",
+                "Sub",
+                "Pow",
+                "ReduceMean",
+                "Div",
                 "Erf",
+                "Concat",
+                "Reshape",
+                "Unsqueeze",
+                "Shape",
                 "Constant",
+                "Mul",
+                "Transpose"
             ],
             "weight_type": "QInt8"
         },
         "encoder_model": {
             "op_types": [
+                "Sqrt",
+                "Conv",
+                "MatMul",
+                "Softmax",
                 "Gather",
+                "Add",
+                "Erf",
                 "Div",
                 "ReduceMean",
+                "Sub",
                 "Pow",
                 "Concat",
                 "Reshape",
+                "Shape",
                 "Constant",
+                "Mul",
+                "Unsqueeze",
+                "Transpose"
             ],
             "weight_type": "QUInt8"
         }