Upload folder using huggingface_hub

Files changed (3) hide show

onnx/decoder_model_merged.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2fcbd6764d2434b969d5851e948e9ccab5779b356f6b586efe696ee6d15380f
+size 1873498357

onnx/decoder_model_merged_quantized.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:033aeddccff186b769d5b0d5a18a8098b5d550bfafe03dde5986089adb98810e
+size 482326148

quantize_config.json CHANGED Viewed

@@ -4,33 +4,33 @@
     "per_model_config": {
         "model": {
             "op_types": [
-                "ConstantOfShape",
-                "Where",
-                "Softmax",
-                "Add",
-                "Mul",
-                "Concat",
-                "Trilu",
-                "Constant",
-                "Shape",
-                "MatMul",
-                "Sigmoid",
-                "Reshape",
-                "Less",
-                "Unsqueeze",
                 "Sub",
-                "Pow",
-                "ReduceMean",
-                "Expand",
-                "Range",
                 "Div",
-                "Squeeze",
                 "Equal",
                 "Cast",
-                "Neg",
-                "Slice",
-                "Gather",
                 "Sqrt",
                 "Transpose"
             ],
             "weight_type": "QInt8"

     "per_model_config": {
         "model": {
             "op_types": [
                 "Sub",
                 "Div",
+                "MatMul",
                 "Equal",
+                "Expand",
+                "ReduceMean",
+                "Squeeze",
+                "Pow",
                 "Cast",
+                "Reshape",
+                "Trilu",
+                "Where",
                 "Sqrt",
+                "Range",
+                "Gather",
+                "Unsqueeze",
+                "Mul",
+                "Sigmoid",
+                "Shape",
+                "Slice",
+                "ConstantOfShape",
+                "Softmax",
+                "Add",
+                "Neg",
+                "Constant",
+                "Concat",
+                "Less",
                 "Transpose"
             ],
             "weight_type": "QInt8"