Xenova HF staff committed on
Commit
9ed28a3
1 Parent(s): 859d73b

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 80035
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 80035
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  80034
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 80034,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  80034
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 80034,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25d921015a99299b825bbce49beff2340bb2e317c8e98581660e2cdcabd3314c
3
- size 430365060
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc00c770b9673d1e4dccee64f90ba447f4cc21af0c5870f6bd77a5d1c5fdbbe3
3
+ size 266453437
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07f4ccd3204c846584b9c4ccade338459d23e0db7a9fa9bcf411197369bafa7b
3
- size 430600542
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd25b3921ea9404fe998ff5927890f3eea6e34d4f2fa67693fc476d4c79f6b2
3
+ size 266689004
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea3147478a2199f55e8efd10661e7afc78fd42637cbb4b81bf86ff50595aa89a
3
- size 109349855
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9db146ed7665ea7d437dc4df564e3af5df923366de4d52aaf2c4b4e3e4ae4f1
3
+ size 67970348
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:783a8f054c54e07982da09fd112e501ed35bdc9be8f251aa3cf78f5f76eb3d97
3
- size 108978499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5c77fd7f60eebdf81d3f6f6fecd8e6804529cbcbecc2bb742fd60f225e2cf3e
3
+ size 67599646
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27e09a6dd9b02284b6aeeaed939150b82779af3ccbef8d6ce06a5ac74f24542f
3
- size 417714551
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65bacf0a6202d80d176b3634d4e8bc6098bb9a6259e24ba7ea64485c258bcee9
3
+ size 253802928
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1b09d1b6257c28fcc012b02d64d289d14c7751316bf167e4050daeaab171fca
3
- size 105707035
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f3d4bd7495686b317ab2e8302805830b0d02899b75ab503d78837c9af99383c
3
+ size 64328182
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Mul",
8
- "Cast",
9
- "Div",
10
- "Where",
11
  "Unsqueeze",
12
- "Concat",
13
- "Reshape",
 
14
  "Add",
15
- "MatMul",
16
- "Sigmoid",
17
- "Sqrt",
18
- "Sub",
19
- "ReduceMean",
20
- "ConstantOfShape",
21
  "Expand",
22
- "Shape",
23
  "Constant",
24
- "Gather",
25
- "Equal",
26
  "Transpose",
 
 
 
 
 
 
 
 
27
  "Pow",
 
 
28
  "Range",
29
- "Softmax"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Mul",
36
- "Cast",
37
- "Div",
38
- "Where",
39
  "Unsqueeze",
40
- "Concat",
41
- "Reshape",
 
42
  "Add",
43
- "MatMul",
44
- "Sigmoid",
45
- "Sqrt",
46
- "Sub",
47
- "ReduceMean",
48
- "ConstantOfShape",
49
  "Expand",
50
- "Shape",
51
  "Constant",
52
- "Gather",
53
- "Equal",
54
  "Transpose",
 
 
 
 
 
 
 
 
55
  "Pow",
 
 
56
  "Range",
57
- "Softmax"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Mul",
64
- "Cast",
65
- "Div",
66
- "Where",
67
  "Unsqueeze",
68
- "Less",
69
- "Concat",
70
- "Reshape",
71
  "Add",
72
- "MatMul",
73
- "Sigmoid",
74
- "Sqrt",
75
- "Sub",
76
- "ReduceMean",
77
- "ConstantOfShape",
78
  "Expand",
79
- "Shape",
80
  "Constant",
81
- "Gather",
82
- "Equal",
83
  "Transpose",
 
 
 
 
 
84
  "Slice",
 
 
 
 
 
 
85
  "Squeeze",
 
86
  "Range",
87
- "Pow",
88
- "Softmax"
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Mul",
95
- "Cast",
96
- "Div",
97
- "Where",
98
  "Unsqueeze",
99
- "Less",
100
- "Concat",
101
- "Reshape",
102
  "Add",
103
- "MatMul",
104
- "Sigmoid",
105
- "Sqrt",
106
- "Sub",
107
- "If",
108
- "ConstantOfShape",
109
- "ReduceMean",
110
  "Expand",
111
- "Shape",
112
  "Constant",
113
- "Gather",
114
- "Equal",
115
  "Transpose",
 
 
 
 
 
116
  "Slice",
 
 
 
 
 
 
117
  "Squeeze",
 
118
  "Range",
119
- "Pow",
120
- "Softmax"
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "Shape",
 
 
 
8
  "Unsqueeze",
9
+ "Gather",
10
+ "Softmax",
11
+ "Where",
12
  "Add",
 
 
 
 
 
 
13
  "Expand",
14
+ "Cast",
15
  "Constant",
 
 
16
  "Transpose",
17
+ "Sub",
18
+ "ConstantOfShape",
19
+ "Concat",
20
+ "Equal",
21
+ "Sqrt",
22
+ "Sigmoid",
23
+ "Div",
24
+ "Mul",
25
  "Pow",
26
+ "MatMul",
27
+ "ReduceMean",
28
  "Range",
29
+ "Reshape"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "Shape",
 
 
 
36
  "Unsqueeze",
37
+ "Gather",
38
+ "Softmax",
39
+ "Where",
40
  "Add",
 
 
 
 
 
 
41
  "Expand",
42
+ "Cast",
43
  "Constant",
 
 
44
  "Transpose",
45
+ "Sub",
46
+ "ConstantOfShape",
47
+ "Concat",
48
+ "Equal",
49
+ "Sqrt",
50
+ "Sigmoid",
51
+ "Div",
52
+ "Mul",
53
  "Pow",
54
+ "MatMul",
55
+ "ReduceMean",
56
  "Range",
57
+ "Reshape"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "Shape",
64
+ "If",
 
 
65
  "Unsqueeze",
66
+ "Gather",
67
+ "Softmax",
68
+ "Where",
69
  "Add",
 
 
 
 
 
 
70
  "Expand",
71
+ "Cast",
72
  "Constant",
 
 
73
  "Transpose",
74
+ "Less",
75
+ "Sub",
76
+ "ConstantOfShape",
77
+ "Concat",
78
+ "Equal",
79
  "Slice",
80
+ "Sqrt",
81
+ "Sigmoid",
82
+ "Div",
83
+ "Mul",
84
+ "Pow",
85
+ "MatMul",
86
  "Squeeze",
87
+ "ReduceMean",
88
  "Range",
89
+ "Reshape"
 
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
+ "Shape",
 
 
 
96
  "Unsqueeze",
97
+ "Gather",
98
+ "Softmax",
99
+ "Where",
100
  "Add",
 
 
 
 
 
 
 
101
  "Expand",
102
+ "Cast",
103
  "Constant",
 
 
104
  "Transpose",
105
+ "Less",
106
+ "Sub",
107
+ "ConstantOfShape",
108
+ "Concat",
109
+ "Equal",
110
  "Slice",
111
+ "Sqrt",
112
+ "Sigmoid",
113
+ "Div",
114
+ "Mul",
115
+ "Pow",
116
+ "MatMul",
117
  "Squeeze",
118
+ "ReduceMean",
119
  "Range",
120
+ "Reshape"
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff