Xenova HF staff committed on
Commit
9f81ce6
1 Parent(s): 1ef5407

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -55,7 +55,7 @@
55
  "scale_embedding": true,
56
  "share_encoder_decoder_embeddings": true,
57
  "static_position_embeddings": true,
58
- "transformers_version": "4.32.0.dev0",
59
  "use_cache": true,
60
  "vocab_size": 59514
61
  }
 
55
  "scale_embedding": true,
56
  "share_encoder_decoder_embeddings": true,
57
  "static_position_embeddings": true,
58
+ "transformers_version": "4.34.0.dev0",
59
  "use_cache": true,
60
  "vocab_size": 59514
61
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  59513
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 59513,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  59513
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 59513,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73941d52cb71e837776a0f5ffafedc363884693c06e645f3544ba7de606fcf09
3
- size 346228960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:991e217b5f162b2578726b483d77f06c70ef03fa0caba5d3d5afa699fa5347c0
3
+ size 224344345
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41f3a332db9b84ef21d284d0930d16af12d9a76eabc0fa5e9349da8f83f87ef4
3
- size 346464442
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d87fdd0e4f16e9ea2b58148624bf58ed64cec7c2c0e8d87bb82f4142b80bad57
3
+ size 224579912
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:256385187890459cb335331afca437d1ff7d495ae41831837e79731f05825188
3
- size 88151662
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:333b244bce16023df04541c8cf9fd60aec9b0569da393c4b831d561897b0bda8
3
+ size 57381512
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27b4e745bb2821200eb0fbae7cccfa6389d25761dcdcb87f07f89b8014fb9e68
3
- size 87780306
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdacc5f38e4d2b805a2fc9f38cf43844cdea56666e735137dbacf2a54a785257
3
+ size 57010810
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cd561f5e0eeefc62d2b903182e5dc341a3779fde1ccd04cdd92662ad5849180
3
- size 333578451
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f79d20e4418b976072f43f7a7a210c9bb62c6a463bff3f07d1ba7b0209b01989
3
+ size 211693836
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a444f7b9da77cc7935a7b65c9e4ce97e78f87be3d8c038ff4af22dd17b3f9c7
3
- size 84508842
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb654354a5cdebf5422cc681e76de54b1f4861e66840a476489be505c8792ad9
3
+ size 53739346
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Add",
8
- "Transpose",
9
- "ReduceMean",
 
10
  "MatMul",
11
- "Mul",
12
  "Expand",
 
 
 
 
 
 
 
 
13
  "Sigmoid",
14
  "Concat",
15
- "Constant",
16
  "Sub",
17
- "Reshape",
18
- "Unsqueeze",
19
- "Cast",
20
- "Equal",
21
- "Sqrt",
22
- "Shape",
23
- "Gather",
24
  "Softmax",
25
- "ConstantOfShape",
26
  "Pow",
27
- "Where",
28
- "Range",
29
- "Div"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Add",
36
- "Transpose",
37
- "ReduceMean",
 
38
  "MatMul",
39
- "Mul",
40
  "Expand",
 
 
 
 
 
 
 
 
41
  "Sigmoid",
42
  "Concat",
43
- "Constant",
44
  "Sub",
45
- "Reshape",
46
- "Unsqueeze",
47
- "Equal",
48
- "Cast",
49
- "Sqrt",
50
- "Shape",
51
- "Gather",
52
  "Softmax",
53
- "ConstantOfShape",
54
  "Pow",
55
- "Where",
56
- "Range",
57
- "Div"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Add",
64
- "Transpose",
65
- "ReduceMean",
 
 
 
66
  "MatMul",
 
 
67
  "Expand",
 
 
 
68
  "Mul",
 
 
 
 
 
69
  "Sigmoid",
70
  "Concat",
71
- "Constant",
72
- "Less",
73
  "Sub",
74
- "Squeeze",
75
- "Reshape",
76
- "Unsqueeze",
77
- "Cast",
78
- "Equal",
79
- "Sqrt",
80
- "Shape",
81
- "Gather",
82
- "ConstantOfShape",
83
  "Softmax",
84
- "Slice",
85
  "Pow",
86
- "Where",
87
- "Range",
88
- "Div"
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Add",
95
- "Transpose",
96
- "ReduceMean",
97
- "Mul",
98
- "Expand",
99
- "MatMul",
100
- "Sigmoid",
101
- "Concat",
102
- "Constant",
103
- "Less",
104
- "Sub",
105
  "Squeeze",
106
- "Reshape",
 
107
  "Unsqueeze",
108
- "Cast",
 
 
 
 
 
109
  "Equal",
110
  "Sqrt",
111
- "Shape",
112
- "If",
113
- "Gather",
 
 
114
  "ConstantOfShape",
 
 
 
 
115
  "Softmax",
116
- "Slice",
117
  "Pow",
118
- "Where",
119
- "Range",
120
- "Div"
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "Gather",
8
+ "Unsqueeze",
9
+ "Shape",
10
+ "Range",
11
  "MatMul",
12
+ "Reshape",
13
  "Expand",
14
+ "Transpose",
15
+ "Equal",
16
+ "Sqrt",
17
+ "Mul",
18
+ "ReduceMean",
19
+ "Cast",
20
+ "Constant",
21
+ "ConstantOfShape",
22
  "Sigmoid",
23
  "Concat",
24
+ "Add",
25
  "Sub",
 
 
 
 
 
 
 
26
  "Softmax",
27
+ "Div",
28
  "Pow",
29
+ "Where"
 
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "Gather",
36
+ "Unsqueeze",
37
+ "Shape",
38
+ "Range",
39
  "MatMul",
40
+ "Reshape",
41
  "Expand",
42
+ "Transpose",
43
+ "Equal",
44
+ "Sqrt",
45
+ "Mul",
46
+ "ReduceMean",
47
+ "Cast",
48
+ "Constant",
49
+ "ConstantOfShape",
50
  "Sigmoid",
51
  "Concat",
 
52
  "Sub",
53
+ "Add",
 
 
 
 
 
 
54
  "Softmax",
55
+ "Div",
56
  "Pow",
57
+ "Where"
 
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "Squeeze",
64
+ "Gather",
65
+ "Less",
66
+ "Unsqueeze",
67
+ "Shape",
68
+ "Range",
69
  "MatMul",
70
+ "Reshape",
71
+ "If",
72
  "Expand",
73
+ "Transpose",
74
+ "Equal",
75
+ "Sqrt",
76
  "Mul",
77
+ "ReduceMean",
78
+ "Cast",
79
+ "Constant",
80
+ "Slice",
81
+ "ConstantOfShape",
82
  "Sigmoid",
83
  "Concat",
84
+ "Add",
 
85
  "Sub",
 
 
 
 
 
 
 
 
 
86
  "Softmax",
87
+ "Div",
88
  "Pow",
89
+ "Where"
 
 
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
 
 
 
 
 
 
 
 
 
 
 
95
  "Squeeze",
96
+ "Gather",
97
+ "Less",
98
  "Unsqueeze",
99
+ "Shape",
100
+ "Range",
101
+ "MatMul",
102
+ "Reshape",
103
+ "Expand",
104
+ "Transpose",
105
  "Equal",
106
  "Sqrt",
107
+ "Mul",
108
+ "ReduceMean",
109
+ "Cast",
110
+ "Constant",
111
+ "Slice",
112
  "ConstantOfShape",
113
+ "Sigmoid",
114
+ "Concat",
115
+ "Add",
116
+ "Sub",
117
  "Softmax",
118
+ "Div",
119
  "Pow",
120
+ "Where"
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff