Upload folder using huggingface_hub

Browse files

Files changed (9)

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +97 -0

config.json CHANGED

@@ -32,7 +32,7 @@
       "max_length": 50
     }
   },
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 50257
 }

       "max_length": 50
     }
   },
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 50257
 }

generation_config.json CHANGED

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.29.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd9d2cc37ed20cf78f52c9f424c61b1605fe88cbce371729198ded0549fed5d9
-size 653666800

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6c4c75bafa80ef5098219808b83d702f0a11524de52c21603ff30e2813213f7
+size 499275976

onnx/decoder_model_merged.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02058bf4773cf0665bd536d1290411ac587a144573590e5fff5e2b18201ef231
-size 654142857

 version https://git-lfs.github.com/spec/v1
+oid sha256:d6aa1de057398705e99e1088f7ff2ef1a04edb19f7a4f2a0ae36fdd76c8d0349
+size 500799139

onnx/decoder_model_merged_quantized.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b25d2fad539d895cad1969530dc77508b5524e06f581215349b503a8f52547d0
-size 166536066

 version https://git-lfs.github.com/spec/v1
+oid sha256:3633bbcb515767629ce17ff7ac1c3bd337f260a1135fb8c76fd9fe0dab876d19
+size 128315766

onnx/decoder_model_quantized.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d5cd0010dac8c74efd687589b5dcee35e4480c313c7afb7e611cacbd6980792
-size 165823091

 version https://git-lfs.github.com/spec/v1
+oid sha256:419f6a0fe721ce9f41f35512347c58132b2e178310454231ca6ec04ff5029445
+size 126556880

onnx/decoder_with_past_model.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:11ed625b30dcdc8777a608c4b3667626faec14d4e9fd7be2e586731fdc9e1700
-size 653673608

 version https://git-lfs.github.com/spec/v1
+oid sha256:9640de43faceabd4ebab467d3b5517dcad4e9eaa1d254e6762640a6965ece3f9
+size 499282782

onnx/decoder_with_past_model_quantized.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7721b8afee3c3ab47485e52e07422e2631f49955865d6fcff20f7c9bd69c82f6
-size 165832141

 version https://git-lfs.github.com/spec/v1
+oid sha256:f65bfa5c0d033ca3db23ece03d34c12d87ea2e7b3007b8944e4a9122ee64e029
+size 126565928

quantize_config.json ADDED

@@ -0,0 +1,97 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Pow",
+                "Sqrt",
+                "Softmax",
+                "Shape",
+                "Concat",
+                "Gather",
+                "ReduceMean",
+                "Div",
+                "MatMul",
+                "Slice",
+                "Transpose",
+                "Mul",
+                "Sub",
+                "Constant",
+                "ConstantOfShape",
+                "Tanh",
+                "Reshape",
+                "Where",
+                "Squeeze",
+                "Split",
+                "Range",
+                "Cast",
+                "Add",
+                "Gemm",
+                "Unsqueeze"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Pow",
+                "Sqrt",
+                "Softmax",
+                "Shape",
+                "Concat",
+                "Gather",
+                "ReduceMean",
+                "Div",
+                "MatMul",
+                "Slice",
+                "Transpose",
+                "Mul",
+                "Sub",
+                "Constant",
+                "ConstantOfShape",
+                "Tanh",
+                "Reshape",
+                "Where",
+                "Squeeze",
+                "If",
+                "Range",
+                "Split",
+                "Cast",
+                "Add",
+                "Gemm",
+                "Unsqueeze"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Pow",
+                "Sqrt",
+                "Softmax",
+                "Shape",
+                "Concat",
+                "Gather",
+                "ReduceMean",
+                "Div",
+                "MatMul",
+                "Slice",
+                "Transpose",
+                "Mul",
+                "Sub",
+                "Constant",
+                "ConstantOfShape",
+                "Tanh",
+                "Reshape",
+                "Where",
+                "Squeeze",
+                "Split",
+                "Range",
+                "Cast",
+                "Add",
+                "Gemm",
+                "Unsqueeze"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}