Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +57 -56
tokenizer.json +3 -3

config.json CHANGED Viewed

@@ -19,7 +19,7 @@
   "rope_scaling": null,
   "rope_theta": 10000.0,
   "tie_word_embeddings": true,
-  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

   "rope_scaling": null,
   "rope_theta": 10000.0,
   "tie_word_embeddings": true,
+  "transformers_version": "4.33.2",
   "use_cache": true,
   "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.34.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.33.2"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2875c864cfa242d3ce797f1c8f47c8779bc4d4d22bedffc7c5220d3405a4b1de
-size 167565936

 version https://git-lfs.github.com/spec/v1
+oid sha256:9993acfcd14528ac8bcefc4a6a8bdeddc2e6aada567c8d9e0c601dd0ec603562
+size 167566461

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:315d6c6d96edac7ab954841322d443a69102c059e8ac20ba89faf3f0236769aa
-size 168376680

 version https://git-lfs.github.com/spec/v1
+oid sha256:c4da7ec2fab9370e45b7e8fbcc1a787e19ad6283aff523b08f9373df9b963849
+size 168377675

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5e81e0464c3028cd88b9f457a8770a16c268258c0fdc290ca04035bdbb575f3
-size 43636490

 version https://git-lfs.github.com/spec/v1
+oid sha256:a5d2095b1db3b264342e0aab8779bdaa311fb3117ae9faddd9e2da26ebd943f8
+size 43637900

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:44b2bc266767e042cb7277e7234c916ca678841ccaef3bc1f3e76bfe6c41f689
-size 42675110

 version https://git-lfs.github.com/spec/v1
+oid sha256:83784ee0b2b115606e5b69d3d5565e99c826d7aa7e1de5437c12b0a964c28c1d
+size 42675859

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7c13e4732ed2e01643955726fa276efa3f3bf49279e42c837ef50893f292b71a
-size 167568570

 version https://git-lfs.github.com/spec/v1
+oid sha256:92d8434248807a07f0a85468cdbdd138171cb2d48c6b25165b99088821346991
+size 167568998

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:886b10a41ecb479dffa829513765f4e445ddcef1c972d5b95aadd10eecd854df
-size 42677756

 version https://git-lfs.github.com/spec/v1
+oid sha256:7d5689e151084aa2dbf309f6f54f13fea852af91d00ebc2c4f5d9f7e96a39044
+size 42678372

quantize_config.json CHANGED Viewed

@@ -5,100 +5,101 @@
         "decoder_with_past_model": {
             "op_types": [
                 "Unsqueeze",
-                "Pow",
-                "If",
-                "Gather",
-                "Constant",
-                "Squeeze",
-                "Reshape",
-                "Slice",
                 "Neg",
-                "ConstantOfShape",
-                "Sigmoid",
                 "Softmax",
                 "Identity",
-                "Sub",
-                "Cast",
                 "Expand",
-                "Div",
                 "Mul",
-                "Add",
                 "Shape",
-                "Sqrt",
-                "Where",
-                "Equal",
                 "MatMul",
                 "Concat",
-                "Transpose",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model": {
             "op_types": [
                 "Unsqueeze",
-                "Pow",
-                "If",
-                "Gather",
-                "Constant",
-                "Squeeze",
-                "Reshape",
-                "Slice",
-                "Less",
                 "Neg",
-                "ConstantOfShape",
-                "Sigmoid",
                 "Softmax",
                 "Identity",
-                "Sub",
                 "Expand",
-                "Div",
                 "Mul",
-                "Add",
                 "Shape",
-                "Sqrt",
-                "Where",
-                "Equal",
                 "MatMul",
-                "Concat",
                 "Range",
-                "Transpose",
                 "Cast",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
                 "Unsqueeze",
-                "Pow",
-                "If",
-                "Gather",
-                "Constant",
-                "Squeeze",
-                "Reshape",
-                "Slice",
-                "Less",
                 "Neg",
-                "ConstantOfShape",
-                "Sigmoid",
                 "Softmax",
                 "Identity",
-                "Sub",
                 "Expand",
-                "Div",
                 "Mul",
-                "Add",
                 "Shape",
-                "Sqrt",
-                "Where",
-                "Equal",
                 "MatMul",
-                "Concat",
                 "Range",
-                "Transpose",
                 "Cast",
-                "ReduceMean"
             ],
             "weight_type": "QInt8"
         }

         "decoder_with_past_model": {
             "op_types": [
                 "Unsqueeze",
+                "Transpose",
                 "Neg",
                 "Softmax",
+                "If",
                 "Identity",
                 "Expand",
+                "Where",
+                "Constant",
                 "Mul",
                 "Shape",
+                "Sigmoid",
                 "MatMul",
+                "Div",
+                "Squeeze",
+                "Range",
+                "Sub",
+                "Pow",
+                "Gather",
                 "Concat",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Reshape",
+                "Sqrt",
+                "Cast",
+                "Slice",
+                "Add",
+                "Equal"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model": {
             "op_types": [
                 "Unsqueeze",
+                "Transpose",
                 "Neg",
+                "Less",
+                "If",
                 "Softmax",
                 "Identity",
                 "Expand",
+                "Where",
+                "Constant",
                 "Mul",
                 "Shape",
+                "Sigmoid",
                 "MatMul",
+                "Div",
+                "Squeeze",
                 "Range",
+                "Sub",
+                "Pow",
+                "Gather",
+                "Concat",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Reshape",
+                "Slice",
                 "Cast",
+                "Sqrt",
+                "Add",
+                "Equal"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
                 "Unsqueeze",
+                "Transpose",
                 "Neg",
+                "Less",
+                "If",
                 "Softmax",
                 "Identity",
                 "Expand",
+                "Where",
+                "Constant",
                 "Mul",
                 "Shape",
+                "Sigmoid",
                 "MatMul",
+                "Div",
+                "Squeeze",
                 "Range",
+                "Sub",
+                "Pow",
+                "Gather",
+                "Concat",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Reshape",
+                "Slice",
                 "Cast",
+                "Sqrt",
+                "Add",
+                "Equal"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

@@ -9,7 +9,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     },
     {
@@ -18,7 +18,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     },
     {
@@ -27,7 +27,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": true,
       "special": true
     }
   ],

       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": false,
       "special": true
     }
   ],