Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +65 -65
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -53,7 +53,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 65001
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 65001
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       65000
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 65000,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       65000
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 65000,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:efd85b3ea1ad8a7482a306144d48bc5c1c22c5536921c1eb5a02aabd64041b5b
-size 368725660

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bd0a586aac3cf44f89fe59319b5fd2297968c00dabd4f0c2a5fd227848891e1
+size 235603669

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b7f52b2928ea2148dadaf7ac79fb9e752c63a8acfab62a9763ba77781abb0f4
-size 368961142

 version https://git-lfs.github.com/spec/v1
+oid sha256:9010a890e540f69db9a8fa2708b11acc41189b685abb59755ef8383ff5399ce0
+size 235839236

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:14479d793e08b11cda59f3634f490f28ad2fc64f53dfad046853e16a794d9fd6
-size 93819733

 version https://git-lfs.github.com/spec/v1
+oid sha256:58759988d510656029ef9ea744efdda9fd66dbfb689333abe7fb29bca7b239f3
+size 60212804

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4cb7e6d213215b29586154c99b17461ef0a9d535a25bb2c6ebcff0d13355db9c
-size 93448377

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c8c3a0502f385dce8dd2a6b4546aaa69423c7097b5f0b0c77c3f097ce68ddde
+size 59842102

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:464008a53bf8942ad80f8482503d2e84dec241e4a2e92d5009e517f6545d0edb
-size 356075151

 version https://git-lfs.github.com/spec/v1
+oid sha256:aeda5ce52ef5a2eb77c782d8be8d2e6aac2ab655f41c0164bdef2d1037e0bd9f
+size 222953160

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ec0cfa5ad9a54f64db7df4e39c44af79cfd1f4deb428fdf4ae2cc91d342b41ea
-size 90176913

 version https://git-lfs.github.com/spec/v1
+oid sha256:97c8776c2ee02d070370bf3135ade8d3e4d8f1bd45308c82c160b78972839ed3
+size 56570638

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Concat",
-                "Equal",
                 "Expand",
-                "Sigmoid",
                 "Add",
                 "Constant",
                 "MatMul",
                 "Cast",
                 "Unsqueeze",
-                "Reshape",
-                "Shape",
                 "Sub",
                 "ConstantOfShape",
-                "Where",
-                "Transpose",
-                "Pow",
                 "Mul",
-                "Div",
-                "Softmax",
-                "ReduceMean",
-                "Sqrt",
-                "Gather",
-                "Range"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Concat",
-                "Equal",
                 "Expand",
-                "Sigmoid",
                 "Add",
                 "Constant",
                 "MatMul",
                 "Cast",
                 "Unsqueeze",
-                "Reshape",
-                "Shape",
                 "Sub",
                 "ConstantOfShape",
-                "Where",
-                "Transpose",
-                "Pow",
                 "Mul",
-                "Div",
-                "Softmax",
-                "ReduceMean",
-                "Sqrt",
-                "Gather",
-                "Range"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Concat",
-                "Equal",
                 "Expand",
-                "Slice",
-                "Sigmoid",
                 "Add",
                 "Constant",
-                "Less",
                 "MatMul",
                 "Cast",
-                "Squeeze",
                 "Unsqueeze",
-                "Reshape",
-                "Shape",
                 "Sub",
                 "ConstantOfShape",
-                "Where",
-                "Transpose",
-                "Pow",
                 "Mul",
-                "Div",
-                "Softmax",
-                "ReduceMean",
-                "Sqrt",
-                "Gather",
-                "Range"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Concat",
-                "Equal",
                 "Expand",
-                "Slice",
-                "Sigmoid",
-                "If",
                 "Add",
                 "Constant",
-                "Less",
                 "MatMul",
                 "Cast",
-                "Squeeze",
                 "Unsqueeze",
-                "Reshape",
-                "Shape",
                 "Sub",
                 "ConstantOfShape",
-                "Where",
-                "Transpose",
-                "Pow",
                 "Mul",
-                "Div",
-                "Softmax",
-                "ReduceMean",
-                "Sqrt",
-                "Gather",
-                "Range"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Sqrt",
+                "Shape",
+                "Div",
+                "Reshape",
                 "Expand",
+                "Pow",
                 "Add",
+                "Equal",
+                "Where",
                 "Constant",
                 "MatMul",
+                "ReduceMean",
                 "Cast",
+                "Range",
+                "Transpose",
                 "Unsqueeze",
+                "Gather",
                 "Sub",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Concat",
                 "Mul",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Sqrt",
+                "Shape",
+                "Div",
+                "Reshape",
                 "Expand",
+                "Pow",
                 "Add",
+                "Equal",
+                "Where",
                 "Constant",
                 "MatMul",
+                "ReduceMean",
                 "Cast",
+                "Range",
+                "Transpose",
                 "Unsqueeze",
+                "Gather",
                 "Sub",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Concat",
                 "Mul",
+                "Softmax"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Sqrt",
+                "Shape",
+                "Div",
+                "Reshape",
                 "Expand",
+                "Pow",
                 "Add",
+                "Equal",
+                "Softmax",
+                "Where",
                 "Constant",
                 "MatMul",
+                "ReduceMean",
+                "Less",
                 "Cast",
+                "Range",
+                "Transpose",
                 "Unsqueeze",
+                "Gather",
                 "Sub",
+                "If",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Squeeze",
+                "Concat",
                 "Mul",
+                "Slice"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Sqrt",
+                "Shape",
+                "Div",
+                "Reshape",
                 "Expand",
+                "Pow",
                 "Add",
+                "Equal",
+                "Softmax",
+                "Where",
                 "Constant",
                 "MatMul",
+                "ReduceMean",
+                "Less",
                 "Cast",
+                "Range",
+                "Transpose",
                 "Unsqueeze",
+                "Gather",
                 "Sub",
+                "Sigmoid",
                 "ConstantOfShape",
+                "Squeeze",
+                "Concat",
                 "Mul",
+                "Slice"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff