steerapi committed on
Commit
8d2a77c
1 Parent(s): bd15347

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -45,3 +45,4 @@ onnx/q1/decoder_model_merged_quantized.onnx.data filter=lfs diff=lfs merge=lfs -
45
  onnx/decoder_model_merged_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
46
  onnx/decoder_model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
47
  onnx/decoder_with_past_model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
45
  onnx/decoder_model_merged_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
46
  onnx/decoder_model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
47
  onnx/decoder_with_past_model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
48
+ onnx/decoder_model_merged_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:289772dc7b8a483e82ca0232aab62d166923f9ffe916109e9dd73d16f5c95525
3
- size 12084802
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:210c6485f34cc1c35daa38072b29cb540c7dc7c04326cfd5b81c1429368398e3
3
+ size 19045741
onnx/decoder_model_merged_quantized.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d312201a36ec7d97cac2fc87c664ef0ec16a681f55ec013b9e3ce383904411e4
3
+ size 6739214336
onnx/quantize_config.json CHANGED
@@ -1,39 +1,39 @@
1
  {
2
- "per_channel": false,
3
- "reduce_range": false,
4
  "use_external_data_format": true,
5
  "per_model_config": {
6
  "decoder_model_merged": {
7
  "op_types": [
8
- "Cast",
9
- "Sigmoid",
 
10
  "If",
11
  "Shape",
12
- "Gather",
13
- "Squeeze",
14
- "Pow",
15
  "Sub",
16
- "Identity",
17
- "Unsqueeze",
18
- "MatMul",
19
- "ReduceMean",
20
- "Constant",
21
  "Equal",
22
- "Sqrt",
23
- "Expand",
24
  "Add",
25
- "Range",
26
- "Less",
 
27
  "Div",
28
- "ConstantOfShape",
 
 
 
 
29
  "Where",
30
- "Transpose",
31
  "Mul",
32
- "Slice",
33
- "Softmax",
34
- "Neg",
35
- "Concat",
36
- "Reshape"
37
  ],
38
  "weight_type": "QInt8"
39
  }
 
1
  {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
  "use_external_data_format": true,
5
  "per_model_config": {
6
  "decoder_model_merged": {
7
  "op_types": [
8
+ "Slice",
9
+ "Sqrt",
10
+ "Less",
11
  "If",
12
  "Shape",
13
+ "Transpose",
14
+ "Range",
 
15
  "Sub",
16
+ "Concat",
17
+ "Squeeze",
18
+ "Cast",
19
+ "Neg",
 
20
  "Equal",
 
 
21
  "Add",
22
+ "Pow",
23
+ "Reshape",
24
+ "Identity",
25
  "Div",
26
+ "Constant",
27
+ "Gather",
28
+ "Softmax",
29
+ "Sigmoid",
30
+ "ReduceMean",
31
  "Where",
 
32
  "Mul",
33
+ "Expand",
34
+ "MatMul",
35
+ "Unsqueeze",
36
+ "ConstantOfShape"
 
37
  ],
38
  "weight_type": "QInt8"
39
  }