Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -0
generation_config.json +1 -1
onnx/decoder_model.onnx +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +1 -1
onnx/decoder_model_quantized.onnx +1 -1
onnx/decoder_with_past_model.onnx +1 -1
onnx/decoder_with_past_model_quantized.onnx +1 -1
quantize_config.json +64 -64

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "Xenova/llama2.c-stories42M",
   "architectures": [
     "LlamaForCausalLM"
   ],

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.33.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e54c6f935c3f8cbe2c9eaf180f1cd18f3314d512261e3d9ffff8ccf4f7e0affd
 size 233102386

 version https://git-lfs.github.com/spec/v1
+oid sha256:57fecedae457d1811cd12abe22589f313aa15c1590e1e09bae3408052e6a74c7
 size 233102386

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:680d2348fa9388e61979d8461735ad105d27e49bedb1601e6b25cd813ac38627
 size 233913496

 version https://git-lfs.github.com/spec/v1
+oid sha256:46464ab95c2c94ad1e493d0ca7746763f367343fce80cdcf7d0036911947564c
 size 233913496

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ecebda7e52b45e63820aba9fda9d9b285bff82c73c80f4ae828f3b6fd589e1de
 size 60022789

 version https://git-lfs.github.com/spec/v1
+oid sha256:afb16b73d5c4f6e825abedc3ce65298ecd567e29c75dc98cc7f7b8dbf9e00074
 size 60022789

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2127d1570779e6856453779104ef0fcf3115d10499e9a3d735cf8192f734c68
 size 59060350

 version https://git-lfs.github.com/spec/v1
+oid sha256:ea09156167b318bfb6149e325a18c79e95e0948175dd3fb496da53ca0589f070
 size 59060350

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f8337fdaae31edbf83ef8477c49374f4d7fba83cb72a3c335546ac85e73d5c82
 size 233104923

 version https://git-lfs.github.com/spec/v1
+oid sha256:47d1d207d61288f734b55448c70e5b344262c01087900f6c258b7805e0ed86a9
 size 233104923

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7feaf947dbef1d8a837620946880a29c64fae88b156d62434b785ead3e7c797a
 size 59062863

 version https://git-lfs.github.com/spec/v1
+oid sha256:ca6889c5883f8686fd4ba12ee26e025b490d7ffcbe1408c8b92f766e3df6f199
 size 59062863

quantize_config.json CHANGED Viewed

@@ -4,102 +4,102 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Unsqueeze",
-                "Concat",
-                "Cast",
-                "Identity",
-                "Div",
-                "Shape",
                 "Softmax",
-                "MatMul",
-                "ConstantOfShape",
                 "If",
-                "Add",
                 "Mul",
-                "Less",
                 "Slice",
-                "Constant",
                 "Range",
-                "Sub",
-                "Expand",
-                "Pow",
                 "Sigmoid",
                 "Where",
-                "Gather",
-                "Neg",
                 "Squeeze",
-                "Equal",
-                "ReduceMean",
-                "Reshape",
-                "Sqrt",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Unsqueeze",
-                "Concat",
-                "Cast",
-                "Identity",
-                "Div",
-                "Shape",
                 "Softmax",
-                "MatMul",
-                "ConstantOfShape",
                 "If",
-                "Add",
                 "Mul",
-                "Less",
                 "Slice",
-                "Constant",
                 "Range",
-                "Sub",
-                "Expand",
-                "Pow",
                 "Sigmoid",
                 "Where",
-                "Gather",
-                "Neg",
                 "Squeeze",
-                "Equal",
-                "ReduceMean",
-                "Reshape",
-                "Sqrt",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Unsqueeze",
-                "Concat",
-                "Cast",
-                "Identity",
-                "Div",
-                "Shape",
                 "Softmax",
-                "MatMul",
-                "ConstantOfShape",
                 "If",
-                "Add",
                 "Mul",
                 "Slice",
-                "Constant",
                 "Range",
-                "Sub",
-                "Expand",
-                "Pow",
                 "Sigmoid",
                 "Where",
-                "Gather",
-                "Neg",
                 "Squeeze",
-                "Equal",
-                "ReduceMean",
-                "Reshape",
-                "Sqrt",
-                "Transpose"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Sub",
                 "Softmax",
+                "Neg",
+                "Sqrt",
+                "Reshape",
                 "If",
+                "Shape",
+                "Transpose",
+                "Pow",
                 "Mul",
+                "MatMul",
+                "Gather",
                 "Slice",
+                "Less",
+                "ReduceMean",
+                "Concat",
                 "Range",
+                "Unsqueeze",
+                "Equal",
+                "Cast",
+                "ConstantOfShape",
+                "Add",
                 "Sigmoid",
                 "Where",
                 "Squeeze",
+                "Constant",
+                "Identity",
+                "Div",
+                "Expand"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
+                "Sub",
                 "Softmax",
+                "Neg",
+                "Sqrt",
+                "Reshape",
                 "If",
+                "Shape",
+                "Transpose",
+                "Pow",
                 "Mul",
+                "MatMul",
+                "Gather",
                 "Slice",
+                "ReduceMean",
+                "Concat",
                 "Range",
+                "Unsqueeze",
+                "Equal",
+                "Cast",
+                "ConstantOfShape",
+                "Add",
                 "Sigmoid",
                 "Where",
                 "Squeeze",
+                "Constant",
+                "Identity",
+                "Div",
+                "Expand"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Sub",
                 "Softmax",
+                "Neg",
+                "Sqrt",
+                "Reshape",
                 "If",
+                "Shape",
+                "Transpose",
+                "Pow",
                 "Mul",
+                "MatMul",
+                "Gather",
                 "Slice",
+                "Less",
+                "ReduceMean",
+                "Concat",
                 "Range",
+                "Unsqueeze",
+                "Equal",
+                "Cast",
+                "ConstantOfShape",
+                "Add",
                 "Sigmoid",
                 "Where",
                 "Squeeze",
+                "Constant",
+                "Identity",
+                "Div",
+                "Expand"
             ],
             "weight_type": "QInt8"
         }