Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +66 -66

config.json CHANGED Viewed

@@ -31,7 +31,7 @@
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "validate_runner_input": true,
   "vocab_size": 49152

   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "validate_runner_input": true,
   "vocab_size": 49152

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 0,
   "eos_token_id": 0,
-  "transformers_version": "4.32.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 0,
   "eos_token_id": 0,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:086035920a278bf46877997575337c46cad5ffc746367a188da646df349f0cda
-size 875006955

 version https://git-lfs.github.com/spec/v1
+oid sha256:994ccba5ea418052a3e1839b1b3c8b4c39342c8537fadf2dacec898daa64ca67
+size 724012077

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e852014acc486bff04ac66ea20bb8e7a8b4b755d608efc404352439f586cbe20
-size 942448642

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b0f375b96dd3a76b25f4d5377eda6376faae560682bed258510f0bbd8289470
+size 791453859

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:45cf095deb2100ff660c231e8bff39af026c8848ad10ffaf57e89749c1e1c3e5
-size 338500911

 version https://git-lfs.github.com/spec/v1
+oid sha256:be7061281a908c61b62bd0bc9dea7a707a72d55a374deab3ccfaec173acc2aa2
+size 299954775

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4910505d4c3186dd789d1d3dfc3e834eca200549185f43beb09bb3bd3e5edd49
-size 270851872

 version https://git-lfs.github.com/spec/v1
+oid sha256:6889a8fdc9daf18b7aa3c6124684eaffd0fb2fba6ee0103064ad719d79d7bf0a
+size 232306103

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94f2798827a11f474b4e8a98f02182b66982c6f934fc959d2b2b74d016afbbd0
-size 875014307

 version https://git-lfs.github.com/spec/v1
+oid sha256:a326b8671e0a683b78557edf7ae89d86172a09451931d1744839ce45c6c42fc9
+size 724019429

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bfc393be238b4a5bd3337c1165a8b17cd63a907a847a6b38b539f8cfe39c6be3
-size 270860829

 version https://git-lfs.github.com/spec/v1
+oid sha256:66061e6a38529a523db921f29bebea1086e4753e60daff773ecfe8fb48ad0b10
+size 232315060

quantize_config.json CHANGED Viewed

@@ -1,98 +1,98 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
     "per_model_config": {
-        "decoder_with_past_model": {
             "op_types": [
-                "CumSum",
-                "ConstantOfShape",
-                "Cast",
-                "Gather",
-                "ReduceMean",
-                "Reshape",
-                "Concat",
-                "Div",
-                "Squeeze",
                 "Unsqueeze",
                 "Equal",
-                "Pow",
                 "Constant",
-                "MatMul",
-                "Sub",
-                "And",
-                "Slice",
                 "Tanh",
-                "Add",
                 "Split",
                 "Mul",
-                "Shape",
-                "Softmax",
-                "Sqrt",
-                "Where",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "CumSum",
-                "ConstantOfShape",
-                "Cast",
-                "Gather",
-                "ReduceMean",
-                "Reshape",
-                "Concat",
-                "Div",
-                "Squeeze",
                 "Unsqueeze",
                 "Equal",
-                "Pow",
                 "Constant",
-                "MatMul",
-                "Sub",
-                "And",
-                "Slice",
                 "Tanh",
-                "Add",
                 "Split",
                 "Mul",
-                "Shape",
-                "Softmax",
-                "Sqrt",
-                "Where",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "CumSum",
-                "ConstantOfShape",
-                "Cast",
-                "Gather",
-                "ReduceMean",
-                "Reshape",
-                "Concat",
-                "Div",
-                "Squeeze",
-                "If",
                 "Unsqueeze",
                 "Equal",
-                "Pow",
                 "Constant",
-                "MatMul",
-                "Sub",
-                "And",
-                "Slice",
                 "Tanh",
-                "Add",
                 "Split",
                 "Mul",
-                "Shape",
-                "Softmax",
-                "Sqrt",
-                "Where",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": false,
+    "reduce_range": false,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
+                "Add",
+                "Shape",
+                "Where",
+                "Sub",
                 "Unsqueeze",
                 "Equal",
+                "Concat",
+                "Reshape",
+                "Softmax",
                 "Constant",
                 "Tanh",
+                "Gather",
+                "CumSum",
+                "Squeeze",
+                "Sqrt",
+                "Cast",
+                "Slice",
                 "Split",
+                "Transpose",
+                "ConstantOfShape",
                 "Mul",
+                "Div",
+                "MatMul",
+                "And",
+                "Pow",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Add",
+                "Shape",
+                "Where",
+                "Sub",
                 "Unsqueeze",
                 "Equal",
+                "Concat",
+                "Reshape",
+                "Softmax",
                 "Constant",
                 "Tanh",
+                "Gather",
+                "CumSum",
+                "Squeeze",
+                "Sqrt",
+                "Cast",
+                "Slice",
                 "Split",
+                "Transpose",
+                "ConstantOfShape",
+                "If",
                 "Mul",
+                "Div",
+                "MatMul",
+                "And",
+                "Pow",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
+                "Add",
+                "Shape",
+                "Where",
+                "Sub",
                 "Unsqueeze",
                 "Equal",
+                "Concat",
+                "Reshape",
+                "Softmax",
                 "Constant",
                 "Tanh",
+                "Gather",
+                "Squeeze",
+                "CumSum",
+                "Sqrt",
+                "Slice",
+                "Cast",
                 "Split",
+                "Transpose",
+                "ConstantOfShape",
                 "Mul",
+                "Div",
+                "MatMul",
+                "And",
+                "Pow",
+                "ReduceMean"
             ],
             "weight_type": "QInt8"
         }