Xenova HF staff committed on
Commit
69b9d6c
1 Parent(s): 5702823

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ onnx/embed_tokens_bnb4.onnx_data filter=lfs diff=lfs merge=lfs -text
37
+ onnx/embed_tokens_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "text-model",
3
+ "architectures": [
4
+ "GemmaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 1,
10
+ "head_dim": 256,
11
+ "hidden_act": "gelu_pytorch_tanh",
12
+ "hidden_activation": "gelu_pytorch_tanh",
13
+ "hidden_size": 2048,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 16384,
16
+ "max_position_embeddings": 8192,
17
+ "model_type": "gemma",
18
+ "num_attention_heads": 8,
19
+ "num_hidden_layers": 18,
20
+ "num_image_tokens": 256,
21
+ "num_key_value_heads": 1,
22
+ "pad_token_id": 0,
23
+ "rms_norm_eps": 1e-06,
24
+ "rope_theta": 10000.0,
25
+ "transformers_version": "4.42.0.dev0",
26
+ "use_cache": true,
27
+ "vocab_size": 257216
28
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.42.0.dev0"
7
+ }
onnx/embed_tokens.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc96fb25a0aec82650b39f01e41689c4b9711c48b3f57bf1a9de41803dedc92e
3
+ size 2107113711
onnx/embed_tokens_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0acc862f7b9691dce35b0273160da94eecfe18d2a6f2425526f079f939b54489
3
+ size 323
onnx/embed_tokens_bnb4.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a68f638671117974950a159fb13edeefdf3cf4147494a7dbaf36f40c69142c0
3
+ size 2107113472
onnx/embed_tokens_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:699140886342b5ba4fc9f56c7111dcb4e515ba19f4ed481777f9a9511a9398ab
3
+ size 1053557125
onnx/embed_tokens_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47001732d5cf1d6e7386eb2fd28f286a332ecce183d13473cea167c8f2491055
3
+ size 526778852
onnx/embed_tokens_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de3e4630ae834f6979223f29db682a8a1de626e66591d9720d098be47c0199a
3
+ size 321
onnx/embed_tokens_q4.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a68f638671117974950a159fb13edeefdf3cf4147494a7dbaf36f40c69142c0
3
+ size 2107113472
onnx/embed_tokens_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47001732d5cf1d6e7386eb2fd28f286a332ecce183d13473cea167c8f2491055
3
+ size 526778852
onnx/embed_tokens_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b6ce4ace76acec6ba30f5f3486546758a271a925d87d17561ed3553e6a360e0
3
+ size 526778852
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa96d4b54700da860700ddec4ee5f4a6a042085259f3131bf654a3c312ef410a
3
+ size 864982
onnx/model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad7f69325a22da08811c520686930b51fd84ea240b092b785f42cd2ae077e74e
3
+ size 10034651136
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dbd4ead7db525d3fb0dbaf704abc11adffaefac35b33c87934f810639162fb7
3
+ size 1569043569
onnx/vision_encoder.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28ab5c10712d0258f21f75093d4e6c47f97df5d362027d6c08af7a9b57fe9e0f
3
+ size 1659889692
onnx/vision_encoder_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d0d0b303249137dd1aa5ae6e61973c984bcca57f0f2648b5371d99dfcef0cf5
3
+ size 238750500
onnx/vision_encoder_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b7977ff5234fa95849d6e87237b81a71121f9351b6bca212f2d0d36632b4918
3
+ size 830494512
onnx/vision_encoder_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbca09516ac12dd17c332a9c554fdba30f38b67c4d167ca7dbdba4ed29c09550
3
+ size 417144008
onnx/vision_encoder_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcb975c7b3fcef3884cd4f280a07e4d5aa37628c5574a0cb3139003ad4cb158c
3
+ size 264899569
onnx/vision_encoder_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b545abe09f4174fd05192f93cfc0ad97948305bbad0fd8021ea8b212e009b1fc
3
+ size 417144094
onnx/vision_encoder_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b545abe09f4174fd05192f93cfc0ad97948305bbad0fd8021ea8b212e009b1fc
3
+ size 417144094
quantize_config.json ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {},
3
+ "q8": {
4
+ "per_model_config": {
5
+ "embed_tokens": {
6
+ "op_types": [
7
+ "Gather"
8
+ ],
9
+ "weight_type": "QInt8"
10
+ },
11
+ "vision_encoder": {
12
+ "op_types": [
13
+ "Add",
14
+ "Cast",
15
+ "Concat",
16
+ "Constant",
17
+ "Conv",
18
+ "Div",
19
+ "Gather",
20
+ "MatMul",
21
+ "Mul",
22
+ "Pow",
23
+ "ReduceMean",
24
+ "Reshape",
25
+ "Shape",
26
+ "Slice",
27
+ "Softmax",
28
+ "Sqrt",
29
+ "Sub",
30
+ "Tanh",
31
+ "Transpose",
32
+ "Unsqueeze"
33
+ ],
34
+ "weight_type": "QUInt8"
35
+ }
36
+ },
37
+ "per_channel": false,
38
+ "reduce_range": false
39
+ },
40
+ "int8": {
41
+ "per_model_config": {
42
+ "embed_tokens": {
43
+ "op_types": [
44
+ "Gather"
45
+ ],
46
+ "weight_type": "QInt8"
47
+ },
48
+ "vision_encoder": {
49
+ "op_types": [
50
+ "Add",
51
+ "Cast",
52
+ "Concat",
53
+ "Constant",
54
+ "Conv",
55
+ "Div",
56
+ "Gather",
57
+ "MatMul",
58
+ "Mul",
59
+ "Pow",
60
+ "ReduceMean",
61
+ "Reshape",
62
+ "Shape",
63
+ "Slice",
64
+ "Softmax",
65
+ "Sqrt",
66
+ "Sub",
67
+ "Tanh",
68
+ "Transpose",
69
+ "Unsqueeze"
70
+ ],
71
+ "weight_type": "QInt8"
72
+ }
73
+ },
74
+ "per_channel": false,
75
+ "reduce_range": false
76
+ },
77
+ "uint8": {
78
+ "per_model_config": {
79
+ "embed_tokens": {
80
+ "op_types": [
81
+ "Gather"
82
+ ],
83
+ "weight_type": "QUInt8"
84
+ },
85
+ "vision_encoder": {
86
+ "op_types": [
87
+ "Add",
88
+ "Cast",
89
+ "Concat",
90
+ "Constant",
91
+ "Conv",
92
+ "Div",
93
+ "Gather",
94
+ "MatMul",
95
+ "Mul",
96
+ "Pow",
97
+ "ReduceMean",
98
+ "Reshape",
99
+ "Shape",
100
+ "Slice",
101
+ "Softmax",
102
+ "Sqrt",
103
+ "Sub",
104
+ "Tanh",
105
+ "Transpose",
106
+ "Unsqueeze"
107
+ ],
108
+ "weight_type": "QUInt8"
109
+ }
110
+ },
111
+ "per_channel": false,
112
+ "reduce_range": false
113
+ },
114
+ "q4": {
115
+ "block_size": 32,
116
+ "is_symmetric": true,
117
+ "accuracy_level": null
118
+ },
119
+ "bnb4": {
120
+ "block_size": 64,
121
+ "quant_type": 1
122
+ }
123
+ }