Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +97 -0

config.json CHANGED Viewed

@@ -25,7 +25,7 @@
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
-  "transformers_version": "4.29.2",
   "use_cache": false,
   "vocab_size": 50258
 }

   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": false,
   "vocab_size": 50258
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.29.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d0c146c6685128082c6bda07a1f282173b3d1d1cd88da5ebeb7ab9800afbf62
-size 1247366820

 version https://git-lfs.github.com/spec/v1
+oid sha256:a99a231b8a22a1f402c6583f803380062c514a44064202e2e8b7ec2a566bbf89
+size 1028642499

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ece03bf266aeebfaa7443a6b1407ed691c0847a3eded5532e78ec6b3af639a0
-size 1247911554

 version https://git-lfs.github.com/spec/v1
+oid sha256:eae2f16345fbce32265ff480f7eeb495876009558c36b8f18df26222aa221fa0
+size 1033379856

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f1d3ea9ddd90714ffaed4c9802d5180ce6f60cbda07cc1e2809082262acc162
-size 318018578

 version https://git-lfs.github.com/spec/v1
+oid sha256:c223b1e05ad637eb36a858a336a6f0e64e2de373d7416ee9a7d42228a71226bf
+size 266589262

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:042ac11cfd8cf883c7e2f78f8e8016a9cf141b7b4a8ec47b4b4d543b4032be65
-size 317201341

 version https://git-lfs.github.com/spec/v1
+oid sha256:638646a1d7305a136fc1f425f462b2adfb9ceb8e072904af47aa7801edcfb24d
+size 261580710

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:27b1b45c132dbc07666091dd94713a3edb392e1502e4b2d90713a6fcc245aaf2
-size 1247374623

 version https://git-lfs.github.com/spec/v1
+oid sha256:f87c69f6ff5915e9918216a2a8ba89f3d226621ddbfe74062782dee3ef1432aa
+size 1028650304

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8aab704b43ee7838c336ad96d38eab71c3f1a27e1b024d1bec01d2e125c38014
-size 317211702

 version https://git-lfs.github.com/spec/v1
+oid sha256:5d0c85b35fc50e18ace78d839b5de103d6368a8507e2722ad63a3bac7e15a155
+size 261591073

quantize_config.json ADDED Viewed

	@@ -0,0 +1,97 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Add",
+                "Erf",
+                "Mul",
+                "Constant",
+                "Sqrt",
+                "Gemm",
+                "Split",
+                "Where",
+                "Transpose",
+                "Sub",
+                "Gather",
+                "ConstantOfShape",
+                "Slice",
+                "Pow",
+                "ReduceMean",
+                "Concat",
+                "Cast",
+                "Squeeze",
+                "Shape",
+                "Range",
+                "MatMul",
+                "Reshape",
+                "Unsqueeze",
+                "Softmax",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Add",
+                "Erf",
+                "Mul",
+                "Constant",
+                "Sqrt",
+                "Gemm",
+                "Split",
+                "Where",
+                "Transpose",
+                "Sub",
+                "Gather",
+                "ConstantOfShape",
+                "Slice",
+                "Pow",
+                "ReduceMean",
+                "Concat",
+                "Cast",
+                "Squeeze",
+                "Shape",
+                "Range",
+                "MatMul",
+                "If",
+                "Reshape",
+                "Unsqueeze",
+                "Softmax",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Add",
+                "Erf",
+                "Mul",
+                "Constant",
+                "Sqrt",
+                "Gemm",
+                "Split",
+                "Where",
+                "Transpose",
+                "Sub",
+                "Gather",
+                "ConstantOfShape",
+                "Slice",
+                "Pow",
+                "ReduceMean",
+                "Concat",
+                "Cast",
+                "Squeeze",
+                "Shape",
+                "Range",
+                "MatMul",
+                "Reshape",
+                "Unsqueeze",
+                "Softmax",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}