Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +125 -0

config.json CHANGED Viewed

@@ -63,7 +63,7 @@
       "num_beams": 4
     }
   },
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 50264
 }

       "num_beams": 4
     }
   },
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 50264
 }

generation_config.json CHANGED Viewed

@@ -12,5 +12,5 @@
   "no_repeat_ngram_size": 3,
   "num_beams": 4,
   "pad_token_id": 1,
-  "transformers_version": "4.29.2"
 }

   "no_repeat_ngram_size": 3,
   "num_beams": 4,
   "pad_token_id": 1,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ace1c96cc44f533ae223f5ebb9db35f4c5cf8e0592284e662c5bae667e06444d
-size 1222931015

 version https://git-lfs.github.com/spec/v1
+oid sha256:37c6b1e1db55c314a525a1981d87e69f332370dfda38c1616d0842be5b790263
+size 1017091776

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f68d519a785d2458cc515dc6d3a1d439d6e2efa0d859d7e7661429dcbe2701dc
-size 1223372254

 version https://git-lfs.github.com/spec/v1
+oid sha256:33c7c9b29bcb80c28b0a8ed7ea5306b2a121985fd3f0ecf53b47f019fe860806
+size 1017574814

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9402d1f0255de4221901a31a6b64c941a427930c57444f994934ccb1e2abaae3
-size 309046228

 version https://git-lfs.github.com/spec/v1
+oid sha256:d747cb8cefbf557f8d3ade8efbd43f9a0a0fbdd6deb7503682071647ee0a7cdc
+size 257435745

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77ab4286473c981329253666bff6763d8b997b322673df9fe0ea86da566bf167
-size 308343853

 version https://git-lfs.github.com/spec/v1
+oid sha256:f0f1596ac223b3ebfd0dab8b14bcf865550bdf0cd23ea9b535a33208b7e7866a
+size 256677944

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2d359d786187e502b60514333fe1d9bb37439467b552136969b6700455744b51
-size 1122089918

 version https://git-lfs.github.com/spec/v1
+oid sha256:f33a93db6d4d0715f99f5ddc29de8f3b08fa9c57407e513d8d22c75e39a8493b
+size 916250419

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9af3c60d51963ce72b6b16fbf0c8586ebc395b7e890e416e476b71603b5c1dd4
-size 282825152

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8e8a8b67b5cc287398e1b018495a82264babe2db2806c18265f63ebd37f4cfe
+size 231158860

quantize_config.json ADDED Viewed

	@@ -0,0 +1,125 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Constant",
+                "Sub",
+                "Expand",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Sqrt",
+                "Cast",
+                "Reshape",
+                "Pow",
+                "Range",
+                "Softmax",
+                "Erf",
+                "Shape",
+                "Squeeze",
+                "Less",
+                "Mul",
+                "Where",
+                "Slice",
+                "Gather",
+                "Unsqueeze",
+                "Transpose",
+                "Add",
+                "Concat",
+                "MatMul",
+                "Div",
+                "Equal"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Constant",
+                "Sub",
+                "Expand",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Sqrt",
+                "Reshape",
+                "Cast",
+                "Pow",
+                "Range",
+                "Softmax",
+                "Erf",
+                "Shape",
+                "Mul",
+                "Where",
+                "Gather",
+                "Unsqueeze",
+                "Transpose",
+                "Add",
+                "Concat",
+                "MatMul",
+                "Div",
+                "Equal"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Constant",
+                "Sub",
+                "Expand",
+                "ConstantOfShape",
+                "If",
+                "ReduceMean",
+                "Sqrt",
+                "Cast",
+                "Reshape",
+                "Pow",
+                "Range",
+                "Softmax",
+                "Erf",
+                "Shape",
+                "Squeeze",
+                "Less",
+                "Mul",
+                "Where",
+                "Slice",
+                "Gather",
+                "Unsqueeze",
+                "Transpose",
+                "Add",
+                "Concat",
+                "MatMul",
+                "Div",
+                "Equal"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Constant",
+                "Sub",
+                "Expand",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Sqrt",
+                "Reshape",
+                "Cast",
+                "Pow",
+                "Range",
+                "Softmax",
+                "Erf",
+                "Shape",
+                "Mul",
+                "Where",
+                "Gather",
+                "Unsqueeze",
+                "Transpose",
+                "Add",
+                "Concat",
+                "MatMul",
+                "Div",
+                "Equal"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}