Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -0
generation_config.json +1 -1
onnx/decoder_model.onnx +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +1 -1
onnx/decoder_model_quantized.onnx +1 -1
onnx/decoder_with_past_model.onnx +1 -1
onnx/decoder_with_past_model_quantized.onnx +1 -1
quantize_config.json +64 -64

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "Xenova/llama2.c-stories15M",
   "architectures": [
     "LlamaForCausalLM"
   ],

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.33.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0fff8a7fe61ffdacec9bfdc7f045bc60ee240c46d63e0c671dabab2a21944c46
 size 97945098

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff5e861cc2ac67ff2ded19ed940b2507ed708612608295fcbf6ecafde8292a0a
 size 97945098

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6816b265a96d80bb85a622c394dc819b269680f327b82ea64f3c77f32117d84e
 size 98260154

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e62780167c73c2596c4a08ff748ce3f3e33fcca0e27e9ba7d83dcbd9c8d5516
 size 98260154

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:473abf17f5284a881ea1086cfead870211b933365a91cead05e2274f94b7d5cb
 size 25279161

 version https://git-lfs.github.com/spec/v1
+oid sha256:ccbf01448c56bf2a96dc640fe8f4a2b018bfea69365a2a972a172144dad400d4
 size 25279161

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:83c62704973668509b573854d3c24d3d47322db722538f0ce6064bc9f425802e
 size 24849487

 version https://git-lfs.github.com/spec/v1
+oid sha256:1fef635548a485428acac2ce40c5de6491a9d73dc2e1192a5a127fd55cd492a4
 size 24849487

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:62dc5b8e6580e7fff028c5bc2993598be53b0d8b28401206a648f3b75517bce8
 size 97945415

 version https://git-lfs.github.com/spec/v1
+oid sha256:83172a6c980948c016f78262097ffa2443c7e4e02ab45b7661bbff65b0886090
 size 97945415

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dafb7a1a57c760eac3203352c6db49456532166dca7ff046bdb5b7127d3eadec
 size 24849120

 version https://git-lfs.github.com/spec/v1
+oid sha256:49d37b90c7c768529f9c643a0543c5bf7d9890f4b1e5c860060ba861beec5e67
 size 24849120

quantize_config.json CHANGED Viewed

@@ -4,102 +4,102 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Squeeze",
-                "Identity",
-                "Constant",
-                "Add",
                 "Pow",
-                "ConstantOfShape",
                 "If",
-                "Reshape",
-                "Sqrt",
-                "Equal",
-                "Where",
                 "Sigmoid",
-                "Sub",
-                "ReduceMean",
-                "Transpose",
                 "Slice",
                 "Neg",
                 "Softmax",
-                "Range",
-                "Shape",
-                "Div",
-                "Gather",
-                "Concat",
                 "Expand",
                 "Cast",
-                "Less",
-                "Unsqueeze",
-                "MatMul",
-                "Mul"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Squeeze",
-                "Identity",
-                "Constant",
-                "Add",
                 "Pow",
-                "ConstantOfShape",
                 "If",
-                "Reshape",
-                "Sqrt",
-                "Equal",
-                "Where",
                 "Sigmoid",
-                "Sub",
-                "ReduceMean",
-                "Transpose",
                 "Slice",
                 "Neg",
                 "Softmax",
-                "Range",
-                "Shape",
-                "Div",
-                "Gather",
-                "Concat",
                 "Expand",
                 "Cast",
-                "Less",
-                "Unsqueeze",
-                "MatMul",
-                "Mul"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Squeeze",
-                "Identity",
-                "Constant",
-                "Add",
                 "Pow",
-                "ConstantOfShape",
                 "If",
-                "Reshape",
-                "Sqrt",
-                "Where",
-                "Equal",
                 "Sigmoid",
-                "Sub",
-                "ReduceMean",
-                "Transpose",
                 "Slice",
                 "Neg",
                 "Softmax",
-                "Range",
-                "Shape",
-                "Div",
-                "Gather",
-                "Concat",
                 "Expand",
                 "Cast",
-                "Unsqueeze",
-                "MatMul",
-                "Mul"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Range",
+                "Reshape",
                 "Pow",
+                "Div",
+                "Add",
+                "ReduceMean",
                 "If",
                 "Sigmoid",
+                "Less",
+                "Sqrt",
+                "Squeeze",
+                "Gather",
+                "Constant",
                 "Slice",
+                "Shape",
+                "Identity",
                 "Neg",
+                "Transpose",
+                "Where",
                 "Softmax",
+                "Unsqueeze",
                 "Expand",
+                "Equal",
                 "Cast",
+                "Concat",
+                "Mul",
+                "Sub",
+                "ConstantOfShape",
+                "MatMul"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
+                "Range",
+                "Reshape",
                 "Pow",
+                "Div",
+                "Add",
+                "ReduceMean",
                 "If",
                 "Sigmoid",
+                "Sqrt",
+                "Squeeze",
+                "Gather",
+                "Constant",
                 "Slice",
+                "Shape",
+                "Identity",
                 "Neg",
+                "Transpose",
+                "Where",
                 "Softmax",
+                "Unsqueeze",
                 "Expand",
+                "Equal",
                 "Cast",
+                "Concat",
+                "Mul",
+                "Sub",
+                "ConstantOfShape",
+                "MatMul"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Range",
+                "Reshape",
                 "Pow",
+                "Div",
+                "Add",
+                "ReduceMean",
                 "If",
                 "Sigmoid",
+                "Less",
+                "Sqrt",
+                "Squeeze",
+                "Gather",
+                "Constant",
                 "Slice",
+                "Shape",
+                "Identity",
                 "Neg",
+                "Transpose",
+                "Where",
                 "Softmax",
+                "Unsqueeze",
                 "Expand",
+                "Equal",
                 "Cast",
+                "Concat",
+                "Mul",
+                "Sub",
+                "ConstantOfShape",
+                "MatMul"
             ],
             "weight_type": "QInt8"
         }