Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +73 -73
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -54,7 +54,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 62518
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 62518
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       62517
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 62517,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       62517
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 62517,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b52cd4f14c3dd176917bd33db3f0cead8b13912488c38b409e181aa6e4b4492b
-size 358545360

 version https://git-lfs.github.com/spec/v1
+oid sha256:2014f22836434baa54069071525be0dd2a540e5bff30862c4fa06456262ba234
+size 230508553

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:12ab2f2ce821aacfc16a73db855dcbae2e4264a790128d319751d66f75c0307c
-size 358780842

 version https://git-lfs.github.com/spec/v1
+oid sha256:0686150fa652d177b0a9eee70f81851d921d2ad169535697a109e3c9878be581
+size 230744120

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a2e3b48cb7ce2f3cbcc5f515431bd80eb14f6f37ac4a89813b061046aeed1226
-size 91254794

 version https://git-lfs.github.com/spec/v1
+oid sha256:7efefcd793a5663bc204224a92a123524f3dfe2ffad59e5f73d6734d1b11ad04
+size 58931576

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e0b716fe5a5c22ecc17dd12e18ed424da84776ffa07ffa27a5b02d9fd2a50b68
-size 90883438

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e4e602c31130176b086cd4bf31d6d08d44a6a367617e910870e0ea3e5408574
+size 58560874

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:566461b2841ecb55692cf8a6c7ebe9acb72cee05b2159d82852d081871c5a733
-size 345894851

 version https://git-lfs.github.com/spec/v1
+oid sha256:8f6941f135f722de84bf26191c340a4fe7958aa10918872db284a9698795665d
+size 217858044

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:99f14fe0f43ec1e1e19d8706712ce82ecdf6bfbd088a98f15101b6720d0dc574
-size 87611974

 version https://git-lfs.github.com/spec/v1
+oid sha256:7946cca821e951629360b4bd12e7965318f777c06c4f0d5443c82197b3b8f169
+size 55289410

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "ConstantOfShape",
-                "Gather",
-                "Sqrt",
-                "Reshape",
                 "Div",
-                "Expand",
                 "Range",
                 "Sub",
-                "Sigmoid",
-                "Softmax",
-                "Pow",
-                "Shape",
-                "ReduceMean",
                 "MatMul",
-                "Unsqueeze",
-                "Concat",
-                "Cast",
-                "Mul",
-                "Constant",
-                "Add",
                 "Equal",
                 "Transpose",
-                "Where"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "ConstantOfShape",
-                "Gather",
-                "Sqrt",
-                "Reshape",
                 "Div",
                 "Range",
-                "Expand",
                 "Sub",
-                "Sigmoid",
-                "Softmax",
-                "Pow",
-                "Shape",
-                "ReduceMean",
                 "MatMul",
-                "Unsqueeze",
-                "Concat",
-                "Cast",
-                "Mul",
-                "Constant",
-                "Add",
                 "Equal",
                 "Transpose",
-                "Where"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Slice",
-                "ConstantOfShape",
-                "Gather",
-                "Sqrt",
-                "Reshape",
                 "Div",
-                "Expand",
                 "Range",
                 "Sub",
-                "Sigmoid",
-                "Softmax",
-                "Pow",
-                "Shape",
-                "ReduceMean",
                 "MatMul",
-                "Unsqueeze",
-                "Concat",
                 "Squeeze",
                 "Less",
-                "Cast",
                 "Mul",
-                "Constant",
-                "Add",
-                "Equal",
                 "Transpose",
-                "Where"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Slice",
-                "ConstantOfShape",
-                "Gather",
-                "Sqrt",
-                "Reshape",
                 "Div",
-                "Expand",
                 "Range",
                 "Sub",
-                "Sigmoid",
-                "Softmax",
-                "Pow",
-                "Shape",
-                "ReduceMean",
                 "MatMul",
-                "Unsqueeze",
-                "Concat",
                 "Squeeze",
                 "Less",
-                "Cast",
                 "Mul",
-                "Constant",
-                "Add",
-                "Equal",
                 "Transpose",
-                "If",
-                "Where"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Softmax",
+                "Cast",
+                "Unsqueeze",
                 "Div",
+                "Gather",
                 "Range",
                 "Sub",
                 "MatMul",
+                "Pow",
                 "Equal",
+                "Sigmoid",
+                "Where",
+                "Expand",
+                "Add",
+                "Mul",
+                "Concat",
                 "Transpose",
+                "ReduceMean",
+                "Sqrt",
+                "Constant",
+                "Shape",
+                "ConstantOfShape",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Softmax",
+                "Cast",
+                "Unsqueeze",
                 "Div",
+                "Gather",
                 "Range",
                 "Sub",
                 "MatMul",
+                "Pow",
                 "Equal",
+                "Sigmoid",
+                "Where",
+                "Expand",
+                "Add",
+                "Mul",
+                "Concat",
                 "Transpose",
+                "ReduceMean",
+                "Sqrt",
+                "Constant",
+                "Shape",
+                "ConstantOfShape",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Softmax",
+                "Cast",
+                "Unsqueeze",
                 "Div",
+                "Gather",
                 "Range",
                 "Sub",
+                "If",
                 "MatMul",
+                "Pow",
+                "Equal",
+                "Sigmoid",
+                "Where",
                 "Squeeze",
+                "Expand",
+                "Add",
                 "Less",
                 "Mul",
+                "Slice",
+                "Concat",
                 "Transpose",
+                "ReduceMean",
+                "Sqrt",
+                "Constant",
+                "Shape",
+                "ConstantOfShape",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Softmax",
+                "Cast",
+                "Unsqueeze",
                 "Div",
+                "Gather",
                 "Range",
                 "Sub",
                 "MatMul",
+                "Pow",
+                "Equal",
+                "Sigmoid",
+                "Where",
                 "Squeeze",
+                "Expand",
+                "Add",
                 "Less",
                 "Mul",
+                "Slice",
+                "Concat",
                 "Transpose",
+                "ReduceMean",
+                "Sqrt",
+                "Constant",
+                "Shape",
+                "ConstantOfShape",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff