Xenova HF staff committed on
Commit
6842a46
1 Parent(s): c55aaf7

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -36,3 +36,4 @@ tokenizer.json filter=lfs diff=lfs merge=lfs -text
36
  onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
38
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
36
  onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
38
  onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
39
+ _model_decoder_embed_positions_Constant_5_attr__value filter=lfs diff=lfs merge=lfs -text
_model_decoder_embed_positions_Constant_5_attr__value ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:613daf130d7105e6e63c6f721a4946bd2f7df255e79255ac886b600cdaa34dbe
3
+ size 4202496
config.json CHANGED
@@ -28,7 +28,7 @@
28
  "pad_token_id": 1,
29
  "scale_embedding": true,
30
  "tokenizer_class": "NllbTokenizer",
31
- "transformers_version": "4.29.2",
32
  "use_cache": true,
33
  "vocab_size": 256206
34
  }
 
28
  "pad_token_id": 1,
29
  "scale_embedding": true,
30
  "tokenizer_class": "NllbTokenizer",
31
+ "transformers_version": "4.33.0.dev0",
32
  "use_cache": true,
33
  "vocab_size": 256206
34
  }
generation_config.json CHANGED
@@ -5,5 +5,5 @@
5
  "eos_token_id": 2,
6
  "max_length": 200,
7
  "pad_token_id": 1,
8
- "transformers_version": "4.29.2"
9
  }
 
5
  "eos_token_id": 2,
6
  "max_length": 200,
7
  "pad_token_id": 1,
8
+ "transformers_version": "4.33.0.dev0"
9
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdeccfd3ba96e8aee7dd045f83182507cba589ca5410642b13b23d3b685041ff
3
- size 562636
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb0e0eba116a5f6491686c5902f41df9ab5919c33a93c2ca088df6091de8856e
3
+ size 1860454885
onnx/decoder_model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a09a3713a8de670fe3d587c7faf36e8d3fad471d2ca87f6029476e6ec74dc811
3
- size 2909290496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66d476d102b3db1819e99a96c154afde049273728e6aaaab6ee5adf0e427f102
3
+ size 2905088000
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5acdac6829a5027d64d687b61339522a6d220f171e282889b8a1181a92e199a
3
- size 1022212
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:004adde69878c3ef0a3fdeea9d4972d901deebeb8f45373f8b2f9abcd15204e9
3
+ size 1865158686
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83bfebbaf034e9c0d64b567a2a601ed5d3dac4904e9cf69e7684db6b9ee103d8
3
- size 731672253
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd66608c2a4194e78f95548fa0e64f24302303698c5b09fa8e1f9e16ec00676b
3
+ size 475505771
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f66977eeb9c38d7146c7a9c2ff99b98d447080c8184b70485cb0f2e48c8098fd
3
- size 730959620
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddea619b640379609719becf91a488c5e6ce4c4b2052efbb5388edaed465a552
3
+ size 470533055
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94d5dfbf3bf2c016442dd34e44438007cd42eb8f9b40103f4eb3d34a42a5d9e2
3
- size 475281
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a786f1fd7c4e961dabd49077f071373ed6f93771ce3bbdd5af6d1fda779522b4
3
+ size 1759606543
onnx/decoder_with_past_model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0427f278d242d85a0bfd7ba91eb2f8b7d4f077d956a9a800962e7bf81010ec7
3
- size 2808528896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3deb104bebee00493919111f377566301e2b00ca37168252f9155ef6953c06
3
+ size 2804326400
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6978ddd13eae91cedf4eaa101101976a1e50cc7b13f1f254996c66217854b0d1
3
- size 705433687
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:374293cb4bb59cd29810851a7cfbc568accb8efdc1a953ac04722e30adaf2d0b
3
+ size 445006987
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eec9001dfa16b09cc0bed3a35904827675a3f0506d23cbf7683e1deb43184d3e
3
- size 1658468857
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3d9f99355917d6cce7423456645e13a3a2a9f1301bfc000548d5c8960407714
3
+ size 1658468942
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56f9138d4d64c187216a562bc3c78b1373cbfceaefb8f20b686e55484ab78eec
3
- size 415968804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cde664eacba07a62f198857ec6c06e09572b1ebb77c8137f1fa99ac604a3a28
3
+ size 419120483
quantize_config.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "Less",
8
+ "Where",
9
+ "ReduceMean",
10
+ "Relu",
11
+ "Slice",
12
+ "ConstantOfShape",
13
+ "CumSum",
14
+ "Range",
15
+ "MatMul",
16
+ "Concat",
17
+ "Pow",
18
+ "Gather",
19
+ "Not",
20
+ "Constant",
21
+ "Unsqueeze",
22
+ "Div",
23
+ "Transpose",
24
+ "Softmax",
25
+ "Reshape",
26
+ "Mul",
27
+ "Equal",
28
+ "Squeeze",
29
+ "Cast",
30
+ "Expand",
31
+ "Sub",
32
+ "Shape",
33
+ "Sqrt",
34
+ "Add"
35
+ ],
36
+ "weight_type": "QInt8"
37
+ },
38
+ "encoder_model": {
39
+ "op_types": [
40
+ "ReduceMean",
41
+ "Where",
42
+ "Relu",
43
+ "CumSum",
44
+ "ConstantOfShape",
45
+ "MatMul",
46
+ "Concat",
47
+ "Pow",
48
+ "Gather",
49
+ "Not",
50
+ "Constant",
51
+ "Unsqueeze",
52
+ "Div",
53
+ "Transpose",
54
+ "Softmax",
55
+ "Reshape",
56
+ "Mul",
57
+ "Equal",
58
+ "Cast",
59
+ "Expand",
60
+ "Sub",
61
+ "Sqrt",
62
+ "Shape",
63
+ "Add"
64
+ ],
65
+ "weight_type": "QInt8"
66
+ },
67
+ "decoder_model_merged": {
68
+ "op_types": [
69
+ "Less",
70
+ "Where",
71
+ "ReduceMean",
72
+ "Relu",
73
+ "Slice",
74
+ "ConstantOfShape",
75
+ "CumSum",
76
+ "Range",
77
+ "MatMul",
78
+ "Concat",
79
+ "Pow",
80
+ "Gather",
81
+ "Not",
82
+ "Constant",
83
+ "Unsqueeze",
84
+ "Div",
85
+ "Transpose",
86
+ "Softmax",
87
+ "Reshape",
88
+ "Mul",
89
+ "Equal",
90
+ "Squeeze",
91
+ "Cast",
92
+ "Expand",
93
+ "Sub",
94
+ "If",
95
+ "Shape",
96
+ "Sqrt",
97
+ "Add"
98
+ ],
99
+ "weight_type": "QInt8"
100
+ },
101
+ "decoder_with_past_model": {
102
+ "op_types": [
103
+ "ReduceMean",
104
+ "Where",
105
+ "Relu",
106
+ "ConstantOfShape",
107
+ "CumSum",
108
+ "MatMul",
109
+ "Concat",
110
+ "Pow",
111
+ "Gather",
112
+ "Not",
113
+ "Constant",
114
+ "Unsqueeze",
115
+ "Div",
116
+ "Transpose",
117
+ "Softmax",
118
+ "Reshape",
119
+ "Mul",
120
+ "Equal",
121
+ "Cast",
122
+ "Expand",
123
+ "Sub",
124
+ "Sqrt",
125
+ "Shape",
126
+ "Add"
127
+ ],
128
+ "weight_type": "QInt8"
129
+ }
130
+ }
131
+ }