Xenova HF staff committed on
Commit
dba7046
1 Parent(s): 7d229d1

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -20,7 +20,7 @@
20
  "output_past": true,
21
  "pad_token_id": 1,
22
  "position_embedding_type": "absolute",
23
- "transformers_version": "4.29.2",
24
  "type_vocab_size": 1,
25
  "use_cache": true,
26
  "vocab_size": 250002
 
20
  "output_past": true,
21
  "pad_token_id": 1,
22
  "position_embedding_type": "absolute",
23
+ "transformers_version": "4.33.0.dev0",
24
  "type_vocab_size": 1,
25
  "use_cache": true,
26
  "vocab_size": 250002
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:188c6b93577e6a112c6e99200ed11f0e2cff105b05e241fd9feed63f8807cc11
3
- size 1881470772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f60fc6d14d071996bee0d007e9fd4eec15403bb5e7c48a6f17773c87311af163
3
+ size 1113464750
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6f942f71d623ffdd8d9c971c87fc6b9734918f300128a3bdb5ca0a545204ca0
3
- size 473560803
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8547220520c540258aef930319fa6304a40cdb43c5c859b5ce5a3ee03c92d74
3
+ size 280308773
quantize_config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Sqrt",
8
+ "Expand",
9
+ "Unsqueeze",
10
+ "CumSum",
11
+ "Not",
12
+ "Erf",
13
+ "MatMul",
14
+ "Sub",
15
+ "Constant",
16
+ "ConstantOfShape",
17
+ "ReduceMean",
18
+ "Pow",
19
+ "Div",
20
+ "Softmax",
21
+ "Gather",
22
+ "Cast",
23
+ "Equal",
24
+ "Transpose",
25
+ "Shape",
26
+ "Where",
27
+ "Mul",
28
+ "Add",
29
+ "Concat",
30
+ "Slice",
31
+ "Reshape"
32
+ ],
33
+ "weight_type": "QInt8"
34
+ }
35
+ }
36
+ }