Upload folder using huggingface_hub

Browse files

Files changed (11)

config.json +2 -2
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
onnx/encoder_model.onnx +1 -1
onnx/encoder_model_quantized.onnx +2 -2
quantize_config.json +139 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "T5ForConditionalGeneration"
   ],
   "d_ff": 2816,
   "d_kv": 64,
   "d_model": 1024,
@@ -25,8 +26,7 @@
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
-  "torch_dtype": "float32",
-  "transformers_version": "4.28.1",
   "use_cache": true,
   "vocab_size": 32128
 }

   "architectures": [
     "T5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 2816,
   "d_kv": 64,
   "d_model": 1024,
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 32128
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.28.1"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:643891f8024e09fcaaf21c7400aea149d8cc88595c2c585db5f82efb4619ce25
-size 1899966406

 version https://git-lfs.github.com/spec/v1
+oid sha256:0af2d5176759dac258e16aa9b5421584e608a20bb8d1234871df44bf7cf2ef05
+size 1899966097

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f8428ae370f32d9abf39c3353c390bb40889b352f40bbb3da5da09dc5330529
-size 1900612838

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d5e34da7b389b73d0aa02aaf5e8e6d42c1299294f77f116772cdf36686d25c2
+size 1900612149

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f01eaef9c2c32baab84ec9101c67b1371a74cd9b437cfa71156dfef6419449ff
-size 477408072

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0455d53b1b0c7edcbcf5b7a17816685f33f49d39da811eb1c2efa3dc35fb85c
+size 479350955

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:345d3af616c67a79077f0f636994ea71319caae37d590d07bfc3625fc7dd5ba1
-size 476285658

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb80680a2cb37392ad0a1ccb36e291a8ca14fff50848a1fe943110d042c91b95
+size 478228998

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b1612f3b65f5565745241e15fa8fca805ed339dce89c3d35b5c82fc774f19b8
-size 1698575820

 version https://git-lfs.github.com/spec/v1
+oid sha256:450dff530ac7190bac7689ecf04f1b5ba3cd484dee7ce073ca2a46009a4fdb2b
+size 1698575515

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f05b0ca08d0e219c48781697ae40aa5663f55016cecbc2c17abfd34c7b62a425
-size 425822799

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce085b88aaf7e1bb564a8c8580ff60129e2191ae85404253060457b5c57f0ee3
+size 427520153

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:95c00dc87260918560692d0ab24eaebb4c2f3cd8588a832e29ba7186f86cce68
 size 1365283172

 version https://git-lfs.github.com/spec/v1
+oid sha256:c58209b472cdf3e7fea925f109fe7ee67d12d99368ccd8d18a18c75cce6a9e51
 size 1365283172

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:26af9fa17778b65326f0e79746b0cc03b9fc8e3812a1c843b9135a5cf57300b5
-size 342049899

 version https://git-lfs.github.com/spec/v1
+oid sha256:c913a4d58ce74bb978125292667050e426692e95bec67a70388569b3cad82034
+size 343340979

quantize_config.json ADDED Viewed

@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Add",
+                "Abs",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Greater",
+                "Log",
+                "Concat",
+                "Cast",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "If",
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}