JohnDoe70 committed on
Commit
058b3be
1 Parent(s): 95649e3

Add model files

Browse files
Files changed (2) hide show
  1. quantize_config.json +32 -0
  2. tokenizer.json +0 -0
quantize_config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Tanh",
8
+ "Gemm",
9
+ "Shape",
10
+ "Mul",
11
+ "Unsqueeze",
12
+ "Erf",
13
+ "ReduceMean",
14
+ "Sub",
15
+ "Softmax",
16
+ "Constant",
17
+ "Add",
18
+ "MatMul",
19
+ "Div",
20
+ "Sqrt",
21
+ "Concat",
22
+ "Gather",
23
+ "Reshape",
24
+ "Transpose",
25
+ "Pow",
26
+ "Slice",
27
+ "Cast"
28
+ ],
29
+ "weight_type": "QInt8"
30
+ }
31
+ }
32
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff