Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +129 -0

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dcfd5ab88829855a3a5964dbb03ae6a5bf89c4c68604c5a295c19c0b9df2992e
+size 46434169

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:89be01958da262ae0b131377dde126d29301cf1386fc7b9138618b6ca1fa4599
+size 39225852

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d221711133a3e43b8ffce46ea67a000327a092dabb97c9894e5a20efe39e1e2
+size 23324980

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b7d10236df94549d01fb111239a91902a8703dff785391c4d2f4f7ff5ed4c2d
+size 12057342

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff449dfdd1f70c699d64c8919559d3b95a678f2a1b2f63db93d134cc34d9202e
+size 39356894

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:203ae59f5c9c1f864e22e8c846d16669ca86ded5475f90d4918d02998d247e98
+size 12057392

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:203ae59f5c9c1f864e22e8c846d16669ca86ded5475f90d4918d02998d247e98
+size 12057392

quantize_config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}