Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

config.json +3 -2
generation_config.json +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +67 -67
tokenizer_config.json +2 -1

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "../llama2.c-stories110M",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -17,8 +17,9 @@
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
   "tie_word_embeddings": false,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

 {
+  "_name_or_path": "Xenova/llama2.c-stories110M",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
+  "rope_theta": 10000.0,
   "tie_word_embeddings": false,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
-  "transformers_version": "4.32.0.dev0"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 2,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:868aa85e2ef1c5021cbf43c57a4bab855047f917cf73de5861a27c2992c66fd9
 size 538320735

 version https://git-lfs.github.com/spec/v1
+oid sha256:c076e620480ce241d3a15e5271e6f7852d804190b0d52673449d5b9cf80052d7
 size 538320735

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2526b5fbf36a866575131e95cf2c0a75fe7a03948e32eba5a05c25cdc1814dc2
-size 137148580

 version https://git-lfs.github.com/spec/v1
+oid sha256:33696a9f854ce32f34b0ec1bf033379514bf427258b6747eafb2da6e1798ccf2
+size 136511989

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8e17c1ec579472eab18b12e182816011631dc488f1f03b4da1318300b0e4e43b
-size 135970716

 version https://git-lfs.github.com/spec/v1
+oid sha256:969bc1893a6b71eeaaea45821666ff947e6260c867cb1da06e47cb6728f28948
+size 135334125

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aff8a3d2b8d73fbadbe90c4e86c575a0560b6b9b6fd664a163abde6622aa5209
-size 135979037

 version https://git-lfs.github.com/spec/v1
+oid sha256:8fef387f70bb057d890c11585f1950c9bd5c633e60afa0ce380b1389cca267a9
+size 135342446

quantize_config.json CHANGED Viewed

@@ -1,105 +1,105 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
     "per_model_config": {
-        "decoder_model_merged": {
             "op_types": [
-                "Slice",
-                "Sqrt",
-                "ConstantOfShape",
-                "Softmax",
-                "Sigmoid",
-                "Equal",
-                "Pow",
                 "Unsqueeze",
-                "Concat",
                 "Sub",
-                "Div",
-                "Constant",
-                "Expand",
-                "Cast",
-                "Range",
-                "Reshape",
                 "If",
-                "Where",
                 "Transpose",
-                "Identity",
                 "Mul",
-                "Shape",
                 "Add",
-                "ReduceMean",
                 "MatMul",
-                "Less",
                 "Gather",
-                "Neg",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Slice",
-                "Sqrt",
-                "Squeeze",
-                "Softmax",
-                "Sigmoid",
-                "Equal",
-                "Pow",
                 "Unsqueeze",
-                "Concat",
                 "Sub",
-                "Div",
-                "Constant",
-                "Expand",
-                "Cast",
-                "Range",
-                "Reshape",
-                "Where",
                 "If",
                 "Transpose",
-                "Identity",
                 "Mul",
-                "Shape",
                 "Add",
-                "ReduceMean",
                 "MatMul",
                 "Gather",
-                "Neg",
-                "ConstantOfShape"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Slice",
-                "Sqrt",
-                "ConstantOfShape",
-                "Softmax",
-                "Sigmoid",
-                "Equal",
-                "Pow",
                 "Unsqueeze",
-                "Concat",
                 "Sub",
-                "Div",
-                "Constant",
-                "Expand",
-                "Range",
-                "Cast",
-                "Reshape",
-                "Where",
                 "If",
                 "Transpose",
-                "Identity",
                 "Mul",
-                "Shape",
                 "Add",
-                "ReduceMean",
                 "MatMul",
-                "Less",
                 "Gather",
-                "Neg",
-                "Squeeze"
             ],
             "weight_type": "QInt8"
         }

 {
+    "per_channel": false,
+    "reduce_range": false,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
                 "Unsqueeze",
                 "Sub",
+                "Sigmoid",
                 "If",
+                "Shape",
                 "Transpose",
+                "Slice",
+                "ReduceMean",
+                "Concat",
+                "Reshape",
+                "Range",
                 "Mul",
+                "Identity",
+                "Softmax",
+                "Pow",
                 "Add",
+                "Div",
+                "Equal",
+                "Neg",
+                "Constant",
                 "MatMul",
+                "ConstantOfShape",
                 "Gather",
+                "Where",
+                "Squeeze",
+                "Cast",
+                "Less",
+                "Expand",
+                "Sqrt"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
                 "Unsqueeze",
                 "Sub",
+                "Sigmoid",
                 "If",
+                "Shape",
                 "Transpose",
+                "Slice",
+                "ReduceMean",
+                "Concat",
+                "Reshape",
+                "Range",
                 "Mul",
+                "Identity",
+                "Softmax",
+                "Pow",
                 "Add",
+                "Div",
+                "Equal",
+                "Neg",
+                "Constant",
                 "MatMul",
+                "ConstantOfShape",
                 "Gather",
+                "Where",
+                "Squeeze",
+                "Cast",
+                "Less",
+                "Expand",
+                "Sqrt"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
                 "Unsqueeze",
                 "Sub",
+                "Sigmoid",
                 "If",
+                "Shape",
                 "Transpose",
+                "Slice",
+                "ReduceMean",
+                "Concat",
+                "Reshape",
                 "Mul",
+                "Identity",
+                "Softmax",
+                "Pow",
                 "Add",
+                "Div",
+                "Equal",
+                "Neg",
+                "Constant",
                 "MatMul",
+                "ConstantOfShape",
                 "Gather",
+                "Where",
+                "Squeeze",
+                "Cast",
+                "Range",
+                "Expand",
+                "Sqrt"
             ],
             "weight_type": "QInt8"
         }

tokenizer_config.json CHANGED Viewed

@@ -27,5 +27,6 @@
     "normalized": true,
     "rstrip": false,
     "single_word": false
-  }
 }

     "normalized": true,
     "rstrip": false,
     "single_word": false
+  },
+  "use_default_system_prompt": true
 }