Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +90 -0

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e44631a1a62f85c35f8f147f086a697e556c881079d29f786426bdd8934e3c90
+size 30291205

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e9063679d074d7516e97d537a2f13d8b316281a5fc617566e67aaf566993add8
+size 30291224

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d489e89eb5250b7db458f835ee0eb27016e0af05e16afbdda7cc6fef36a8fcd
+size 15229540

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d16cba523e28b6fa1af7730c434788080cdcefe3193851d13aca27fc4a54572
+size 7990828

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e9063679d074d7516e97d537a2f13d8b316281a5fc617566e67aaf566993add8
+size 30291224

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e37777e83a9ef29901d91e595eb909c026fd2dbbf9a4bd2899a8fd7ffb9f5f93
+size 7990872

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e37777e83a9ef29901d91e595eb909c026fd2dbbf9a4bd2899a8fd7ffb9f5f93
+size 7990872

quantize_config.json ADDED Viewed

	@@ -0,0 +1,90 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Sigmoid",
+                    "Sub"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Sigmoid",
+                    "Sub"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Sigmoid",
+                    "Sub"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}