Xenova HF staff committed on
Commit
f5c922d
1 Parent(s): 6014ea3

Upload folder using huggingface_hub

Browse files
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67abb2f72a3abfb8891293e49fb64600aa08185ae42dd46a9a5e19a06760a190
3
+ size 16175490
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a52bccc85c1004aabf961745099294f80971bc7f22485bf2f728fa262ec8581
3
+ size 16175509
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c9cbbe3ec9ee0bd3a866514c1c8d089415b5b31d4e8072dceca85def5aa276b
3
+ size 8160627
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65eba5213ad021082d16c12141ec6a8e99963f14ecc0c094bb2dd3996c6e985
3
+ size 4370559
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a52bccc85c1004aabf961745099294f80971bc7f22485bf2f728fa262ec8581
3
+ size 16175509
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b84125140b1c9752bb85f49171bcea9039d55fda5d2b21d2cb3d5dd41024ac45
3
+ size 4370597
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b84125140b1c9752bb85f49171bcea9039d55fda5d2b21d2cb3d5dd41024ac45
3
+ size 4370597
quantize_config.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {},
3
+ "q8": {
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Add",
8
+ "BatchNormalization",
9
+ "Constant",
10
+ "Conv",
11
+ "Div",
12
+ "Erf",
13
+ "Flatten",
14
+ "Gemm",
15
+ "GlobalAveragePool",
16
+ "Identity",
17
+ "Mul",
18
+ "ReduceMean",
19
+ "Relu",
20
+ "Sigmoid",
21
+ "Sub"
22
+ ],
23
+ "weight_type": "QUInt8"
24
+ }
25
+ },
26
+ "per_channel": false,
27
+ "reduce_range": false
28
+ },
29
+ "int8": {
30
+ "per_model_config": {
31
+ "model": {
32
+ "op_types": [
33
+ "Add",
34
+ "BatchNormalization",
35
+ "Constant",
36
+ "Conv",
37
+ "Div",
38
+ "Erf",
39
+ "Flatten",
40
+ "Gemm",
41
+ "GlobalAveragePool",
42
+ "Identity",
43
+ "Mul",
44
+ "ReduceMean",
45
+ "Relu",
46
+ "Sigmoid",
47
+ "Sub"
48
+ ],
49
+ "weight_type": "QInt8"
50
+ }
51
+ },
52
+ "per_channel": false,
53
+ "reduce_range": false
54
+ },
55
+ "uint8": {
56
+ "per_model_config": {
57
+ "model": {
58
+ "op_types": [
59
+ "Add",
60
+ "BatchNormalization",
61
+ "Constant",
62
+ "Conv",
63
+ "Div",
64
+ "Erf",
65
+ "Flatten",
66
+ "Gemm",
67
+ "GlobalAveragePool",
68
+ "Identity",
69
+ "Mul",
70
+ "ReduceMean",
71
+ "Relu",
72
+ "Sigmoid",
73
+ "Sub"
74
+ ],
75
+ "weight_type": "QUInt8"
76
+ }
77
+ },
78
+ "per_channel": false,
79
+ "reduce_range": false
80
+ },
81
+ "q4": {
82
+ "block_size": 32,
83
+ "is_symmetric": true,
84
+ "accuracy_level": null
85
+ },
86
+ "bnb4": {
87
+ "block_size": 64,
88
+ "quant_type": 1
89
+ }
90
+ }