Upload folder using huggingface_hub

Browse files

Files changed (9)

config.json +1 -0
generation_config.json +1 -1
onnx/decoder_model.onnx +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +1 -1
onnx/decoder_model_quantized.onnx +1 -1
onnx/decoder_with_past_model.onnx +1 -1
onnx/decoder_with_past_model_quantized.onnx +1 -1
quantize_config.json +70 -70

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "Xenova/llama2.c-stories110M",
   "architectures": [
     "LlamaForCausalLM"
   ],

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.33.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a5e2b243114cc61be8bf88035c2ad85b879a298177bdb31c98582e4d8e8fa222
 size 537368189

 version https://git-lfs.github.com/spec/v1
+oid sha256:518f877e2dccc56ad030d9720872f2ac692b61835e31e116ffb285582384c623
 size 537368189

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c076e620480ce241d3a15e5271e6f7852d804190b0d52673449d5b9cf80052d7
 size 538320735

 version https://git-lfs.github.com/spec/v1
+oid sha256:d591ab765b32cfefa5586ac7a7b5577240195902b70e39c903d9bac4f1acd4b0
 size 538320735

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33696a9f854ce32f34b0ec1bf033379514bf427258b6747eafb2da6e1798ccf2
 size 136511989

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4fb65533cebf47090f460b15dfadf306db447e9ec5bcf3735f6299e59a020ea
 size 136511989

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:969bc1893a6b71eeaaea45821666ff947e6260c867cb1da06e47cb6728f28948
 size 135334125

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ca251aacafd0bc97b73272fa713f888b84507269c83a85420f17af2fa595bd5
 size 135334125

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8a33b0ab5193433d1ed4660a27337421bbbfdf28f1ad92517dfa7c772a5b0f
 size 537375208

 version https://git-lfs.github.com/spec/v1
+oid sha256:6b700555c3d04fa980bd6a55518ed2474f47e7bd9dfb60ace122e9d61694a471
 size 537375208

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8fef387f70bb057d890c11585f1950c9bd5c633e60afa0ce380b1389cca267a9
 size 135342446

 version https://git-lfs.github.com/spec/v1
+oid sha256:405c4a5918d015b814a8e94f4c19c31c6eee15579e71c9b23dd25bcaef48d75c
 size 135342446

quantize_config.json CHANGED Viewed

@@ -4,102 +4,102 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Unsqueeze",
-                "Sub",
-                "Sigmoid",
-                "If",
-                "Shape",
-                "Transpose",
-                "Slice",
-                "ReduceMean",
                 "Concat",
-                "Reshape",
-                "Range",
-                "Mul",
-                "Identity",
                 "Softmax",
                 "Pow",
-                "Add",
-                "Div",
                 "Equal",
-                "Neg",
-                "Constant",
-                "MatMul",
-                "ConstantOfShape",
                 "Gather",
-                "Where",
                 "Squeeze",
-                "Cast",
-                "Less",
-                "Expand",
-                "Sqrt"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Unsqueeze",
-                "Sub",
-                "Sigmoid",
-                "If",
-                "Shape",
-                "Transpose",
-                "Slice",
-                "ReduceMean",
                 "Concat",
-                "Reshape",
-                "Range",
-                "Mul",
-                "Identity",
                 "Softmax",
                 "Pow",
-                "Add",
-                "Div",
                 "Equal",
-                "Neg",
-                "Constant",
-                "MatMul",
-                "ConstantOfShape",
                 "Gather",
-                "Where",
                 "Squeeze",
-                "Cast",
-                "Less",
-                "Expand",
-                "Sqrt"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Unsqueeze",
-                "Sub",
-                "Sigmoid",
-                "If",
-                "Shape",
-                "Transpose",
-                "Slice",
-                "ReduceMean",
                 "Concat",
-                "Reshape",
-                "Mul",
-                "Identity",
                 "Softmax",
                 "Pow",
-                "Add",
-                "Div",
                 "Equal",
-                "Neg",
-                "Constant",
-                "MatMul",
-                "ConstantOfShape",
                 "Gather",
-                "Where",
-                "Squeeze",
-                "Cast",
                 "Range",
-                "Expand",
-                "Sqrt"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
                 "Concat",
+                "Where",
+                "Less",
+                "ConstantOfShape",
+                "Neg",
+                "Sqrt",
+                "Div",
                 "Softmax",
+                "MatMul",
+                "Slice",
+                "Reshape",
+                "Shape",
                 "Pow",
+                "Cast",
                 "Equal",
+                "Add",
+                "Expand",
+                "Mul",
+                "Sub",
                 "Gather",
+                "Identity",
+                "Range",
+                "Transpose",
+                "Constant",
                 "Squeeze",
+                "If",
+                "ReduceMean",
+                "Sigmoid",
+                "Unsqueeze"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
                 "Concat",
+                "Where",
+                "ConstantOfShape",
+                "Neg",
+                "Sqrt",
+                "Div",
                 "Softmax",
+                "MatMul",
+                "Slice",
+                "Reshape",
+                "Shape",
                 "Pow",
+                "Cast",
                 "Equal",
+                "Add",
+                "Expand",
+                "Mul",
+                "Sub",
                 "Gather",
+                "Identity",
+                "Range",
+                "Transpose",
+                "Constant",
                 "Squeeze",
+                "If",
+                "ReduceMean",
+                "Sigmoid",
+                "Unsqueeze"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
                 "Concat",
+                "Where",
+                "Less",
+                "ConstantOfShape",
+                "Neg",
+                "Sqrt",
+                "Div",
                 "Softmax",
+                "MatMul",
+                "Slice",
+                "Reshape",
+                "Shape",
                 "Pow",
+                "Cast",
                 "Equal",
+                "Add",
+                "Expand",
+                "Mul",
+                "Sub",
                 "Gather",
+                "Identity",
                 "Range",
+                "Transpose",
+                "Constant",
+                "Squeeze",
+                "If",
+                "ReduceMean",
+                "Sigmoid",
+                "Unsqueeze"
             ],
             "weight_type": "QInt8"
         }