Xenova HF staff committed on
Commit
e9546e1
1 Parent(s): ec86f4b

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. quantize_config.json +42 -0
config.json CHANGED
@@ -44,7 +44,7 @@
44
  "output_past": false,
45
  "pad_token_id": 1,
46
  "scale_embedding": false,
47
- "transformers_version": "4.29.2",
48
  "use_cache": true,
49
  "vocab_size": 50265
50
  }
 
44
  "output_past": false,
45
  "pad_token_id": 1,
46
  "scale_embedding": false,
47
+ "transformers_version": "4.34.0.dev0",
48
  "use_cache": true,
49
  "vocab_size": 50265
50
  }
quantize_config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Erf",
8
+ "NonZero",
9
+ "Tanh",
10
+ "ReduceMean",
11
+ "Reshape",
12
+ "Transpose",
13
+ "Equal",
14
+ "Pow",
15
+ "Slice",
16
+ "Where",
17
+ "ScatterND",
18
+ "Expand",
19
+ "Shape",
20
+ "Concat",
21
+ "MatMul",
22
+ "Sqrt",
23
+ "Range",
24
+ "Less",
25
+ "Add",
26
+ "Gather",
27
+ "Unsqueeze",
28
+ "Div",
29
+ "Gemm",
30
+ "Constant",
31
+ "Mul",
32
+ "Softmax",
33
+ "Squeeze",
34
+ "ConstantOfShape",
35
+ "Cast",
36
+ "GatherND",
37
+ "Sub"
38
+ ],
39
+ "weight_type": "QInt8"
40
+ }
41
+ }
42
+ }