nanmoon committed on
Commit
a1cd40b
1 Parent(s): 451df26

onnx model

Browse files
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69ed3f810d3b6d13f70dff9ca89966f39c0a0e877fb88211be7bcc070df2a2ce
3
+ size 1336854281
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4842b56e233be1cc74770f57f63b1ebb6cf357cca3dd73fcdec35c019f8a5d6e
3
+ size 336983162
quantize_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Reshape",
8
+ "Pow",
9
+ "Slice",
10
+ "Transpose",
11
+ "Mul",
12
+ "Sub",
13
+ "Add",
14
+ "Concat",
15
+ "Unsqueeze",
16
+ "ReduceMean",
17
+ "Constant",
18
+ "Gather",
19
+ "Softmax",
20
+ "Sqrt",
21
+ "Cast",
22
+ "Div",
23
+ "Shape",
24
+ "Erf",
25
+ "MatMul"
26
+ ],
27
+ "weight_type": "QInt8"
28
+ }
29
+ }
30
+ }