Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

config.json +100 -0
generation_config.json +6 -0
onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +132 -0

config.json ADDED Viewed

	@@ -0,0 +1,100 @@

+{
+  "_name_or_path": "apple/OpenELM-450M-Instruct",
+  "activation_fn_name": "swish",
+  "architectures": [
+    "OpenELMForCausalLM"
+  ],
+  "auto_map": {
+    "AutoConfig": "apple/OpenELM-450M-Instruct--configuration_openelm.OpenELMConfig",
+    "AutoModelForCausalLM": "apple/OpenELM-450M-Instruct--modeling_openelm.OpenELMForCausalLM"
+  },
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "ffn_dim_divisor": 256,
+  "ffn_multipliers": [
+    0.5,
+    0.68,
+    0.87,
+    1.05,
+    1.24,
+    1.42,
+    1.61,
+    1.79,
+    1.97,
+    2.16,
+    2.34,
+    2.53,
+    2.71,
+    2.89,
+    3.08,
+    3.26,
+    3.45,
+    3.63,
+    3.82,
+    4.0
+  ],
+  "ffn_with_glu": true,
+  "head_dim": 64,
+  "initializer_range": 0.02,
+  "max_context_length": 2048,
+  "model_dim": 1536,
+  "model_type": "openelm",
+  "normalization_layer_name": "rms_norm",
+  "normalize_qk_projections": true,
+  "num_gqa_groups": 4,
+  "num_kv_heads": [
+    3,
+    3,
+    3,
+    4,
+    4,
+    4,
+    4,
+    4,
+    4,
+    4,
+    5,
+    5,
+    5,
+    5,
+    5,
+    5,
+    6,
+    6,
+    6,
+    6
+  ],
+  "num_query_heads": [
+    12,
+    12,
+    12,
+    16,
+    16,
+    16,
+    16,
+    16,
+    16,
+    16,
+    20,
+    20,
+    20,
+    20,
+    20,
+    20,
+    24,
+    24,
+    24,
+    24
+  ],
+  "num_transformer_layers": 20,
+  "qkv_multipliers": [
+    0.5,
+    1.0
+  ],
+  "rope_freq_constant": 10000,
+  "rope_max_length": 4096,
+  "share_input_output_layers": true,
+  "transformers_version": "4.38.2",
+  "use_cache": true,
+  "vocab_size": 32000
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.38.2"
+}

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:70f0b0a1c938f6a379904c5a875bc3db170c67b4db0286b7233d5bcde2afbcdc
+size 2032462018

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3cf5ad2f548ce6b1189614c21652e2ae8cc3fd7f002a08ee61e9ce13170b0048
+size 461146769

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:866def23c1fbd676407a229c1027750304622cc7bf736e8821cec8834ca88ab2
+size 1019112984

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aa43693120de488220fb7f8c92edddde78448aa6f516d37783a63a5776d7512a
+size 514121019

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4f064a5b45c1e3d32d2dc68284ca068056e2acbddb0fa8beb165ddb1807e75fe
+size 489715705

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aa43693120de488220fb7f8c92edddde78448aa6f516d37783a63a5776d7512a
+size 514121019

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ceebd65902448f1ed7c60fee531ffaad0039f34ad0512abc29e1e4d4aeab9826
+size 514121063

quantize_config.json ADDED Viewed

	@@ -0,0 +1,132 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "And",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "ConstantOfShape",
+                    "Div",
+                    "Equal",
+                    "Expand",
+                    "Gather",
+                    "MatMul",
+                    "Mul",
+                    "Neg",
+                    "Pow",
+                    "Range",
+                    "ReduceMean",
+                    "Reshape",
+                    "ScatterND",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Sub",
+                    "Tile",
+                    "Transpose",
+                    "Unsqueeze",
+                    "Where"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}