Xenova HF staff committed on
Commit
d9d18a0
1 Parent(s): 624e461

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 35464
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 35464
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  35463
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 35463,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  35463
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 35463,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:906d24158b6abfff73d3f3a9477d8774581e9008599b149a931b17f683b07297
3
- size 247623959
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6abd546a59f79bdbc04e3258fc072a17f6b2ea39ef7e92d45588cdccbf58bacc
3
+ size 174993745
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c14b770d42c0f0473d701b621e0eabafbd265f0d9a8f235ca54c2e974c71df3e
3
- size 247859441
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a31980303aa38a40bb64c8c04bbce8c84a659a1b132202fe8c21070f0a98cf3
3
+ size 175229312
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ff747091aa9705f539cb2bac07d05c372e4fea14d1416737110a5d603317999
3
- size 63308012
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdab252b615eaac60d09d94a7d5c28fa9b588d87f00d5f56c2780bacc6fbf41c
3
+ size 44971712
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fbabbde316b1324624889f16dd8a3a55d5930ac51c3780be63a1b1591cd1349
3
- size 62936656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:240ba81c9660d30c17ea4eb79857e04ff208146c90e059a8ffa5f84a6c3bc3e3
3
+ size 44601010
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfcec3347c1201a5692f1b5e83d3d4657b48177d40a0ab760e39a34ca2d6c705
3
- size 234973450
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60517355b849a7744d9a9b54ed1d71aad9f54406a71c092cc51716c91eeb7ee8
3
+ size 162343236
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b580c5bba606c6e74f6496e56687bf722882d7e56f09cac19c22b87352232ce1
3
- size 59665192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7428bf11240654a05996c6a4b802cc25a1ba97302fe653fef8452f52a2a797a8
3
+ size 41329546
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Equal",
 
8
  "Shape",
9
- "Concat",
 
 
 
 
10
  "Where",
 
11
  "ConstantOfShape",
12
- "Reshape",
13
- "Div",
14
- "Softmax",
15
- "Sigmoid",
16
- "Transpose",
17
  "Sqrt",
18
- "Expand",
19
- "Cast",
20
  "Gather",
21
- "Constant",
22
- "Unsqueeze",
23
- "Sub",
24
- "Range",
25
- "ReduceMean",
26
  "Mul",
27
- "Add",
28
- "MatMul",
29
- "Pow"
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Equal",
 
36
  "Shape",
37
- "Concat",
 
 
 
 
38
  "Where",
 
39
  "ConstantOfShape",
40
- "Reshape",
41
- "Div",
42
- "Softmax",
43
- "Sigmoid",
44
- "Transpose",
45
  "Sqrt",
46
- "Expand",
47
- "Cast",
48
  "Gather",
49
- "Constant",
50
- "Unsqueeze",
51
- "Sub",
52
- "Range",
53
- "ReduceMean",
54
  "Mul",
55
- "Add",
56
- "MatMul",
57
- "Pow"
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Equal",
 
 
64
  "Shape",
65
- "Concat",
66
  "Slice",
 
 
 
 
 
67
  "Where",
 
68
  "ConstantOfShape",
69
- "Reshape",
70
- "Div",
71
- "Squeeze",
72
- "Softmax",
73
- "Sigmoid",
74
- "Transpose",
75
  "Sqrt",
76
- "Expand",
77
- "Cast",
 
78
  "Gather",
79
- "Constant",
80
  "Less",
81
- "Unsqueeze",
82
- "Sub",
83
- "Range",
84
- "ReduceMean",
85
  "Mul",
86
- "Add",
87
- "MatMul",
88
- "Pow"
 
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Equal",
 
 
95
  "Shape",
96
- "Concat",
97
  "Slice",
 
 
 
 
 
98
  "Where",
 
99
  "ConstantOfShape",
100
- "Reshape",
101
- "Div",
102
- "Squeeze",
103
- "If",
104
- "Softmax",
105
- "Sigmoid",
106
- "Transpose",
107
  "Sqrt",
108
- "Expand",
109
- "Cast",
110
  "Gather",
111
- "Constant",
112
  "Less",
113
- "Unsqueeze",
114
- "Sub",
115
- "Range",
116
- "ReduceMean",
117
  "Mul",
118
- "Add",
119
- "MatMul",
120
- "Pow"
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "Sigmoid",
8
+ "Add",
9
  "Shape",
10
+ "ReduceMean",
11
+ "Cast",
12
+ "Sub",
13
+ "Transpose",
14
+ "Constant",
15
  "Where",
16
+ "Unsqueeze",
17
  "ConstantOfShape",
 
 
 
 
 
18
  "Sqrt",
19
+ "Concat",
20
+ "MatMul",
21
  "Gather",
22
+ "Reshape",
23
+ "Pow",
24
+ "Div",
 
 
25
  "Mul",
26
+ "Equal",
27
+ "Range",
28
+ "Softmax",
29
+ "Expand"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "Sigmoid",
36
+ "Add",
37
  "Shape",
38
+ "ReduceMean",
39
+ "Cast",
40
+ "Sub",
41
+ "Transpose",
42
+ "Constant",
43
  "Where",
44
+ "Unsqueeze",
45
  "ConstantOfShape",
 
 
 
 
 
46
  "Sqrt",
47
+ "Concat",
48
+ "MatMul",
49
  "Gather",
50
+ "Reshape",
51
+ "Pow",
52
+ "Div",
 
 
53
  "Mul",
54
+ "Equal",
55
+ "Range",
56
+ "Softmax",
57
+ "Expand"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "Sigmoid",
64
+ "Squeeze",
65
+ "Add",
66
  "Shape",
 
67
  "Slice",
68
+ "ReduceMean",
69
+ "Cast",
70
+ "Sub",
71
+ "Transpose",
72
+ "Constant",
73
  "Where",
74
+ "Unsqueeze",
75
  "ConstantOfShape",
 
 
 
 
 
 
76
  "Sqrt",
77
+ "If",
78
+ "Concat",
79
+ "MatMul",
80
  "Gather",
 
81
  "Less",
82
+ "Reshape",
83
+ "Pow",
84
+ "Div",
 
85
  "Mul",
86
+ "Equal",
87
+ "Range",
88
+ "Softmax",
89
+ "Expand"
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
+ "Sigmoid",
96
+ "Squeeze",
97
+ "Add",
98
  "Shape",
 
99
  "Slice",
100
+ "ReduceMean",
101
+ "Cast",
102
+ "Sub",
103
+ "Transpose",
104
+ "Constant",
105
  "Where",
106
+ "Unsqueeze",
107
  "ConstantOfShape",
 
 
 
 
 
 
 
108
  "Sqrt",
109
+ "Concat",
110
+ "MatMul",
111
  "Gather",
 
112
  "Less",
113
+ "Reshape",
114
+ "Pow",
115
+ "Div",
 
116
  "Mul",
117
+ "Equal",
118
+ "Range",
119
+ "Softmax",
120
+ "Expand"
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff