Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +75 -75
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -54,7 +54,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 37745
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 37745
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       37744
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 37744,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       37744
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 37744,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:caad18fa59833b4ab7effcf5fd77ba9d8dec3c1d318ba5e98664b4ce47a16b82
-size 256976059

 version https://git-lfs.github.com/spec/v1
+oid sha256:99750cd9e5c6a6c6f492a03bf08532932fe2d8f00fe42297bb3dedf1935180e4
+size 179674357

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1f288e6ce9d4ca9f38305c90acc6c0ec1d85d7ba4aa5c8671f0889c26c4f749
-size 257211541

 version https://git-lfs.github.com/spec/v1
+oid sha256:410f1cbcef22d8214b6bebf61f939d5bdf2f607e9ddb91ef9e1763af02e2a2b2
+size 179909924

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1dd6baa3bc101c080b8dc0fe607a0fce3b59de95c493cbce329820367ceba7f
-size 65664285

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c0291f2524b6c9843e32bc843f6a5f07db89ccb781caf15b325e5a25302e7ef
+size 46148708

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c19b7aa331cee07571ae165a9cb4dcdc95b535afe63d3abccb76085bff653a24
-size 65292929

 version https://git-lfs.github.com/spec/v1
+oid sha256:fe92f12d8b5733d0913d8ab1865d1dd0ca376c9ba9f4bd5ef37d725562e3288a
+size 45778006

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39a069ed8b04189564f3e27d1b46560703c3f6de976e239a5aaaf882e2a5d9a3
-size 244325550

 version https://git-lfs.github.com/spec/v1
+oid sha256:9c681aab60969591cf1c4df987e650ab8bd0bab8d7e3a2c0adce1e4bb3f26009
+size 167023848

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c1a572d7518233863a962db9a13104383d85556e9ef570f8593c5ee4dff28e90
-size 62021465

 version https://git-lfs.github.com/spec/v1
+oid sha256:38aee00bba12e88fd8a3712649ad6e9117dba4b804b3f6263abbab8c2340ca80
+size 42506542

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Sqrt",
-                "Shape",
                 "Mul",
-                "Pow",
-                "Range",
                 "Constant",
-                "MatMul",
-                "Add",
-                "Div",
-                "Gather",
-                "Where",
-                "Sigmoid",
                 "ConstantOfShape",
-                "Sub",
-                "Cast",
-                "Unsqueeze",
                 "Transpose",
                 "Expand",
-                "Softmax",
-                "ReduceMean",
-                "Equal",
                 "Reshape",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Sqrt",
-                "Shape",
                 "Mul",
-                "Pow",
-                "Range",
                 "Constant",
-                "MatMul",
-                "Add",
-                "Div",
-                "Gather",
-                "Where",
-                "Sigmoid",
                 "ConstantOfShape",
-                "Sub",
-                "Cast",
-                "Unsqueeze",
                 "Transpose",
                 "Expand",
-                "Softmax",
-                "ReduceMean",
-                "Equal",
                 "Reshape",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Sqrt",
-                "Shape",
                 "Mul",
-                "Pow",
-                "Range",
-                "Slice",
                 "Constant",
-                "MatMul",
-                "Add",
-                "Div",
-                "Gather",
-                "Where",
-                "Sigmoid",
                 "ConstantOfShape",
-                "Sub",
                 "Less",
-                "Cast",
-                "Unsqueeze",
                 "Transpose",
-                "Squeeze",
                 "Expand",
-                "Softmax",
-                "ReduceMean",
-                "Equal",
                 "Reshape",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Sqrt",
-                "Shape",
                 "Mul",
-                "Pow",
-                "Range",
-                "Slice",
                 "Constant",
-                "MatMul",
-                "Add",
-                "Div",
-                "Gather",
-                "Where",
-                "Sigmoid",
                 "ConstantOfShape",
-                "Sub",
                 "Less",
-                "Cast",
-                "Unsqueeze",
                 "Transpose",
-                "Squeeze",
                 "Expand",
-                "Softmax",
-                "ReduceMean",
-                "Equal",
-                "If",
                 "Reshape",
-                "Concat"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Concat",
                 "Mul",
+                "Shape",
                 "Constant",
+                "Softmax",
+                "Equal",
                 "ConstantOfShape",
+                "Pow",
+                "Where",
                 "Transpose",
                 "Expand",
+                "Sqrt",
+                "Gather",
+                "Div",
+                "Cast",
+                "Sigmoid",
+                "Range",
                 "Reshape",
+                "Unsqueeze",
+                "Add",
+                "ReduceMean",
+                "MatMul",
+                "Sub"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Concat",
                 "Mul",
+                "Shape",
                 "Constant",
+                "Softmax",
+                "Equal",
                 "ConstantOfShape",
+                "Pow",
+                "Where",
                 "Transpose",
                 "Expand",
+                "Sqrt",
+                "Gather",
+                "Div",
+                "Cast",
+                "Sigmoid",
+                "Range",
                 "Reshape",
+                "Unsqueeze",
+                "Add",
+                "ReduceMean",
+                "MatMul",
+                "Sub"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Concat",
                 "Mul",
+                "Shape",
                 "Constant",
+                "Softmax",
+                "Equal",
                 "ConstantOfShape",
+                "Squeeze",
+                "Pow",
                 "Less",
+                "Where",
                 "Transpose",
                 "Expand",
+                "Sqrt",
+                "Gather",
+                "Div",
+                "Cast",
+                "Sigmoid",
+                "Range",
                 "Reshape",
+                "Unsqueeze",
+                "Add",
+                "If",
+                "ReduceMean",
+                "MatMul",
+                "Slice",
+                "Sub"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Concat",
                 "Mul",
+                "Shape",
                 "Constant",
+                "Softmax",
+                "Equal",
                 "ConstantOfShape",
+                "Squeeze",
+                "Pow",
                 "Less",
+                "Where",
                 "Transpose",
                 "Expand",
+                "Sqrt",
+                "Gather",
+                "Div",
+                "Cast",
+                "Sigmoid",
+                "Range",
                 "Reshape",
+                "Unsqueeze",
+                "Add",
+                "ReduceMean",
+                "MatMul",
+                "Slice",
+                "Sub"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff