Upload folder using huggingface_hub

#4
by Xenova HF staff - opened
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "google/gemma-7b-it",
3
  "architectures": [
4
  "GemmaForCausalLM"
5
  ],
@@ -9,6 +9,7 @@
9
  "eos_token_id": 1,
10
  "head_dim": 2,
11
  "hidden_act": "gelu",
 
12
  "hidden_size": 8,
13
  "initializer_range": 0.02,
14
  "intermediate_size": 16,
@@ -21,8 +22,7 @@
21
  "rms_norm_eps": 1e-06,
22
  "rope_scaling": null,
23
  "rope_theta": 10000.0,
24
- "torch_dtype": "float32",
25
- "transformers_version": "4.38.1",
26
  "use_cache": true,
27
  "vocab_size": 256000
28
  }
 
1
  {
2
+ "_name_or_path": "Xenova/tiny-random-GemmaForCausalLM",
3
  "architectures": [
4
  "GemmaForCausalLM"
5
  ],
 
9
  "eos_token_id": 1,
10
  "head_dim": 2,
11
  "hidden_act": "gelu",
12
+ "hidden_activation": "gelu_pytorch_tanh",
13
  "hidden_size": 8,
14
  "initializer_range": 0.02,
15
  "intermediate_size": 16,
 
22
  "rms_norm_eps": 1e-06,
23
  "rope_scaling": null,
24
  "rope_theta": 10000.0,
25
+ "transformers_version": "4.42.0.dev0",
 
26
  "use_cache": true,
27
  "vocab_size": 256000
28
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 2,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.38.1"
7
  }
 
3
  "bos_token_id": 2,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.42.0.dev0"
7
  }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea87779ee6e68454bd7f3cde0c2f8fb891f9529f2f56d511982be2d92e7f5007
3
- size 75410798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2690dc6dccb2393d7c1d6e456444b4fa0ee0f166dd372e0df06fab250b054f
3
+ size 8304714
onnx/model_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bce66ef1fd853191e102bad41e1b29dbbb31ea78a5eccdf0d4bf29e0ff59bcdc
3
- size 75408909
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef59b214123dfc30d8a933cece7a73e585a28ea08b32b133ed93b54afd3ad67
3
+ size 8302825
onnx/model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d21c72a0226346ad38834d26c991dad3d1ea773971b97fc07c22c94f6932ebf
3
- size 71357852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb98884b766db6f6f30c860a60b77c204eb5348b02ebb3daf1ea49786625f6b
3
+ size 4254070
onnx/model_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15ccaf18b573045e6fe591f4f766c5bc0d988735972801d04414c0b25e2cd6dc
3
- size 69323622
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dec01b08412c43540eb9d96c979828c2295442946a2a6ae3ab04c0a7a2215900
3
+ size 2219842
onnx/model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51b2cb87f0dfaba5874151dba68ce9dfc114da33291f65ab7ddb62e6be29154c
3
- size 75410735
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2844d53f01272ea5db79b0edd6fd50fe64d4f4d01361d16dfa859e142cc9f9df
3
+ size 8304651
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15ccaf18b573045e6fe591f4f766c5bc0d988735972801d04414c0b25e2cd6dc
3
- size 69323622
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dec01b08412c43540eb9d96c979828c2295442946a2a6ae3ab04c0a7a2215900
3
+ size 2219842
onnx/model_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a80107bb992dcf56fd591e11204c91bac83a3c2a02d54d9da9aad7710bc3f86f
3
- size 69323621
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a7ccd538c06cc6b615b30023b45926052696481ebfc0bc020e8d499a65f87dd
3
+ size 2219841
quantize_config.json ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {},
3
+ "q8": {
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Add",
8
+ "Cast",
9
+ "Concat",
10
+ "Constant",
11
+ "ConstantOfShape",
12
+ "Cos",
13
+ "Div",
14
+ "Equal",
15
+ "Expand",
16
+ "Gather",
17
+ "Greater",
18
+ "Identity",
19
+ "MatMul",
20
+ "Mul",
21
+ "Neg",
22
+ "Pow",
23
+ "Range",
24
+ "ReduceMean",
25
+ "Reshape",
26
+ "ScatterND",
27
+ "Shape",
28
+ "Sin",
29
+ "Slice",
30
+ "Softmax",
31
+ "Sqrt",
32
+ "Tanh",
33
+ "Transpose",
34
+ "Trilu",
35
+ "Unsqueeze",
36
+ "Where"
37
+ ],
38
+ "weight_type": "QInt8"
39
+ }
40
+ },
41
+ "per_channel": true,
42
+ "reduce_range": true
43
+ },
44
+ "int8": {
45
+ "per_model_config": {
46
+ "model": {
47
+ "op_types": [
48
+ "Add",
49
+ "Cast",
50
+ "Concat",
51
+ "Constant",
52
+ "ConstantOfShape",
53
+ "Cos",
54
+ "Div",
55
+ "Equal",
56
+ "Expand",
57
+ "Gather",
58
+ "Greater",
59
+ "Identity",
60
+ "MatMul",
61
+ "Mul",
62
+ "Neg",
63
+ "Pow",
64
+ "Range",
65
+ "ReduceMean",
66
+ "Reshape",
67
+ "ScatterND",
68
+ "Shape",
69
+ "Sin",
70
+ "Slice",
71
+ "Softmax",
72
+ "Sqrt",
73
+ "Tanh",
74
+ "Transpose",
75
+ "Trilu",
76
+ "Unsqueeze",
77
+ "Where"
78
+ ],
79
+ "weight_type": "QInt8"
80
+ }
81
+ },
82
+ "per_channel": true,
83
+ "reduce_range": true
84
+ },
85
+ "uint8": {
86
+ "per_model_config": {
87
+ "model": {
88
+ "op_types": [
89
+ "Add",
90
+ "Cast",
91
+ "Concat",
92
+ "Constant",
93
+ "ConstantOfShape",
94
+ "Cos",
95
+ "Div",
96
+ "Equal",
97
+ "Expand",
98
+ "Gather",
99
+ "Greater",
100
+ "Identity",
101
+ "MatMul",
102
+ "Mul",
103
+ "Neg",
104
+ "Pow",
105
+ "Range",
106
+ "ReduceMean",
107
+ "Reshape",
108
+ "ScatterND",
109
+ "Shape",
110
+ "Sin",
111
+ "Slice",
112
+ "Softmax",
113
+ "Sqrt",
114
+ "Tanh",
115
+ "Transpose",
116
+ "Trilu",
117
+ "Unsqueeze",
118
+ "Where"
119
+ ],
120
+ "weight_type": "QUInt8"
121
+ }
122
+ },
123
+ "per_channel": true,
124
+ "reduce_range": true
125
+ },
126
+ "q4": {
127
+ "block_size": 32,
128
+ "is_symmetric": true,
129
+ "accuracy_level": null
130
+ },
131
+ "bnb4": {
132
+ "block_size": 64,
133
+ "quant_type": 1
134
+ }
135
+ }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05e97791a5e007260de1db7e1692e53150e08cea481e2bf25435553380c147ee
3
- size 17477929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17a91ce4908a747435938ec27fe0f811551fdc89a64222b539f8de528b7fd81b
3
+ size 17477957