Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +2 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +139 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "T5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 2048,
   "d_kv": 64,
   "d_model": 512,
@@ -53,7 +54,7 @@
       "prefix": "translate English to Romanian: "
     }
   },
-  "transformers_version": "4.29.2",
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 32128
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.29.2"
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:380ec9b11e607cc87169efd74c04634724ae40cc0e4ed22964a28f235701e7ab
-size 232468834
+oid sha256:937c37fbaf0a0e539e6019f604abc5285f4d13196aa2643674210449d8dbca66
+size 166670419

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ff0c5b93a304e8b08ee7f97e6bb0ed13d3a4343a3fb7c71e99b2cbbcf831068
-size 232631325
+oid sha256:e7366705cc2418efb8211fce9aea2050845edff8c74066903d608c024e54fa6d
+size 166832597

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:851c4f09c24d06dd56423d42991c6cc1baae3d2f54ce0315200acb9af08aa8e6
-size 59043179
+oid sha256:022ea05ec1c067113e03e4513c7a4c498044b316959de0a7c1dd1950e3308aa6
+size 42431407

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bae5d8a47b7d1ab4462be4779471f69ab6e72625a150eb64d206ee1eab6ed133
-size 58765649
+oid sha256:fe424ae0e0f10b6219a2a839c894df55c64158897bfd7dda6db155179cdb6bf4
+size 42154655

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:21793391fb0645b01924b80ece6307c1947a6ae725c82611323aa6d459a62fe3
-size 219874970
+oid sha256:05cca57c04b30f90263eb6cc4f460b90ab33b45d54368623dcc61d0154c8d5f5
+size 154076559

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f02802ba62544115d0ca9b3acb3b08564c37ecf2fa897b901c08c08d9088dc3
-size 55563102
+oid sha256:5be205c8cd47b6a32d5e04abb36ff5aa07dd5613c87fe3191a81bc0a99c8f0ba
+size 38952122

quantize_config.json ADDED Viewed

@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Constant",
+                "Concat",
+                "Shape",
+                "Transpose",
+                "Sqrt",
+                "Cast",
+                "Gather",
+                "LessOrEqual",
+                "MatMul",
+                "Less",
+                "Tile",
+                "Div",
+                "Unsqueeze",
+                "Reshape",
+                "Sub",
+                "Log",
+                "Min",
+                "Neg",
+                "Where",
+                "Add",
+                "Relu",
+                "Softmax",
+                "Range",
+                "Expand",
+                "ReduceMean",
+                "Pow",
+                "ConstantOfShape",
+                "Mul"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Constant",
+                "Concat",
+                "Shape",
+                "Transpose",
+                "Sqrt",
+                "Cast",
+                "Gather",
+                "MatMul",
+                "Less",
+                "Div",
+                "Unsqueeze",
+                "Reshape",
+                "Sub",
+                "Abs",
+                "Log",
+                "Min",
+                "Where",
+                "Add",
+                "Greater",
+                "Relu",
+                "Softmax",
+                "Range",
+                "ReduceMean",
+                "Pow",
+                "ConstantOfShape",
+                "Mul"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Constant",
+                "Concat",
+                "If",
+                "Shape",
+                "Transpose",
+                "Sqrt",
+                "Cast",
+                "Gather",
+                "LessOrEqual",
+                "MatMul",
+                "Less",
+                "Tile",
+                "Slice",
+                "Div",
+                "Unsqueeze",
+                "Reshape",
+                "Sub",
+                "Log",
+                "Min",
+                "Neg",
+                "Where",
+                "Add",
+                "Relu",
+                "Softmax",
+                "Range",
+                "Expand",
+                "ReduceMean",
+                "Pow",
+                "ConstantOfShape",
+                "Mul"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Constant",
+                "Concat",
+                "Shape",
+                "Transpose",
+                "Sqrt",
+                "Cast",
+                "Gather",
+                "LessOrEqual",
+                "MatMul",
+                "Less",
+                "Tile",
+                "Slice",
+                "Div",
+                "Unsqueeze",
+                "Reshape",
+                "Sub",
+                "Log",
+                "Min",
+                "Neg",
+                "Where",
+                "Add",
+                "Relu",
+                "Softmax",
+                "Range",
+                "Expand",
+                "ReduceMean",
+                "Pow",
+                "ConstantOfShape",
+                "Mul"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}