Xenova HF staff committed on
Commit
19012ac
1 Parent(s): 2322319

Upload folder using huggingface_hub

Browse files
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b53ee5a5ccf91dad271e6de1aa38189b2326d67fd1fdedcb9a391cd51333e0e
3
- size 348872491
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92db26402a4674e94b78e6f1b4c459f5dfa257b5f6a944696240c87594c25532
3
+ size 348843867
onnx/decoder_model_merged_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d981bfb3710d94c11749ff3cb6a1762be393e9021d01b0c77d312376fdeaac9
3
- size 233534625
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd351112c6b9492b2bf2bb15b1a2d935f4f38261ef7c89db936ce086b024456
3
+ size 233506001
onnx/decoder_model_merged_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa6d2c9f9ec665b90cf447e92652e8626f8622d9593834e52cadc135c99e99dd
3
- size 174558131
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2dcf943b868d04eb30f99315ff0b93ba6bacbf19190ef1ea8f3a7eaed29e635
3
+ size 174610059
onnx/decoder_model_merged_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ff9cc1f5ec7150f5085aa15044d923fbdf392c92f86916a87d005505283682f
3
- size 301363513
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:202be61c83f3830c25844bff2b74b0297828ddf53f9696f31a8f5f6815d40d8a
3
+ size 88980775
onnx/decoder_model_merged_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09985c682350705128c03670eb194050df8451c51ef8c5fbb72ae76e3e0cb4d9
3
- size 235631471
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:926177238243860750ac395fed2cfe63da6c4ecdf6f1cebb71bc4ad292d8d3c9
3
+ size 235602847
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ff9cc1f5ec7150f5085aa15044d923fbdf392c92f86916a87d005505283682f
3
- size 301363513
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:202be61c83f3830c25844bff2b74b0297828ddf53f9696f31a8f5f6815d40d8a
3
+ size 88980775
onnx/decoder_model_merged_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d0a1c88d4326f0075ea7866eeb1a7d48ac3489d28b2253eb97406482209e604
3
- size 301363506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eedb66af82477bccaaecb186f69b7f59941bfb12270639544b70e155ab25994
3
+ size 88980786
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87ce60aae236f0306d5689f0a26d3cfb4ed93548716ce1d9ecca5d9dbfbe9ead
3
- size 1229214934
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd0ef9a15a8491d80add27d04f9d22e11543f26ff8ccdd8d72034aba28704f76
3
+ size 1229351354
onnx/encoder_model_bnb4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:affe1219278db31e47e26835c872bdfdaa35db62357b7632639a98fff11d7849
3
- size 191147368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43f09b742cfd01b1bed0e1b798acc8f476a1e5b3bd6fdb77d7fd776c483edf7c
3
+ size 191283788
onnx/encoder_model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:778d55314e55fe9b67b2c7971cd03c5fcfe08a795cf63323de7cb994a28e2c5c
3
- size 614782019
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a21bad736df71ff52bb23a646a11534eceb659720868fdcf3ed68b90cae60c4
3
+ size 615124148
onnx/encoder_model_int8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8948bf97b094f560bb843294a0aeb9e65588f02d88febc41ef7c589a4881d281
3
- size 313220478
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c1a6fdbf77f383f63fba8428d5635e5d404d0862a24cfd49057e6dc6ab11e9e
3
+ size 313562621
onnx/encoder_model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be332e57b058bf3edebaaa135e97511a0ac0ead2d90a960755357e588c0c4411
3
- size 210020560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca56d971bbfd94e8819a1787b09f1ab73f0aa745023ef2b3b7a2c7e620ba31bd
3
+ size 210156980
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3a0619e8051e8dab1e65e2b653617bacb003dbfc45130f03f0c8ebce2d3d565
3
- size 313220547
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cba66774b515bea3b260266572bba513e0266c9a36e463501c87ee3aecc28e26
3
+ size 313562690
onnx/encoder_model_uint8.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3a0619e8051e8dab1e65e2b653617bacb003dbfc45130f03f0c8ebce2d3d565
3
- size 313220547
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cba66774b515bea3b260266572bba513e0266c9a36e463501c87ee3aecc28e26
3
+ size 313562690
quantize_config.json CHANGED
@@ -5,18 +5,23 @@
5
  "encoder_model": {
6
  "op_types": [
7
  "Add",
 
 
8
  "Conv",
9
  "Div",
10
  "Erf",
 
11
  "MatMul",
12
  "Mul",
13
  "Pow",
14
  "ReduceMean",
15
  "Reshape",
 
16
  "Softmax",
17
  "Sqrt",
18
  "Sub",
19
- "Transpose"
 
20
  ],
21
  "weight_type": "QUInt8"
22
  },
@@ -77,6 +82,7 @@
77
  "decoder_model_merged": {
78
  "op_types": [
79
  "Add",
 
80
  "Concat",
81
  "Constant",
82
  "ConstantOfShape",
@@ -114,18 +120,23 @@
114
  "encoder_model": {
115
  "op_types": [
116
  "Add",
 
 
117
  "Conv",
118
  "Div",
119
  "Erf",
 
120
  "MatMul",
121
  "Mul",
122
  "Pow",
123
  "ReduceMean",
124
  "Reshape",
 
125
  "Softmax",
126
  "Sqrt",
127
  "Sub",
128
- "Transpose"
 
129
  ],
130
  "weight_type": "QInt8"
131
  },
@@ -186,6 +197,7 @@
186
  "decoder_model_merged": {
187
  "op_types": [
188
  "Add",
 
189
  "Concat",
190
  "Constant",
191
  "ConstantOfShape",
@@ -223,18 +235,23 @@
223
  "encoder_model": {
224
  "op_types": [
225
  "Add",
 
 
226
  "Conv",
227
  "Div",
228
  "Erf",
 
229
  "MatMul",
230
  "Mul",
231
  "Pow",
232
  "ReduceMean",
233
  "Reshape",
 
234
  "Softmax",
235
  "Sqrt",
236
  "Sub",
237
- "Transpose"
 
238
  ],
239
  "weight_type": "QUInt8"
240
  },
@@ -295,6 +312,7 @@
295
  "decoder_model_merged": {
296
  "op_types": [
297
  "Add",
 
298
  "Concat",
299
  "Constant",
300
  "ConstantOfShape",
 
5
  "encoder_model": {
6
  "op_types": [
7
  "Add",
8
+ "Concat",
9
+ "Constant",
10
  "Conv",
11
  "Div",
12
  "Erf",
13
+ "Gather",
14
  "MatMul",
15
  "Mul",
16
  "Pow",
17
  "ReduceMean",
18
  "Reshape",
19
+ "Shape",
20
  "Softmax",
21
  "Sqrt",
22
  "Sub",
23
+ "Transpose",
24
+ "Unsqueeze"
25
  ],
26
  "weight_type": "QUInt8"
27
  },
 
82
  "decoder_model_merged": {
83
  "op_types": [
84
  "Add",
85
+ "Cast",
86
  "Concat",
87
  "Constant",
88
  "ConstantOfShape",
 
120
  "encoder_model": {
121
  "op_types": [
122
  "Add",
123
+ "Concat",
124
+ "Constant",
125
  "Conv",
126
  "Div",
127
  "Erf",
128
+ "Gather",
129
  "MatMul",
130
  "Mul",
131
  "Pow",
132
  "ReduceMean",
133
  "Reshape",
134
+ "Shape",
135
  "Softmax",
136
  "Sqrt",
137
  "Sub",
138
+ "Transpose",
139
+ "Unsqueeze"
140
  ],
141
  "weight_type": "QInt8"
142
  },
 
197
  "decoder_model_merged": {
198
  "op_types": [
199
  "Add",
200
+ "Cast",
201
  "Concat",
202
  "Constant",
203
  "ConstantOfShape",
 
235
  "encoder_model": {
236
  "op_types": [
237
  "Add",
238
+ "Concat",
239
+ "Constant",
240
  "Conv",
241
  "Div",
242
  "Erf",
243
+ "Gather",
244
  "MatMul",
245
  "Mul",
246
  "Pow",
247
  "ReduceMean",
248
  "Reshape",
249
+ "Shape",
250
  "Softmax",
251
  "Sqrt",
252
  "Sub",
253
+ "Transpose",
254
+ "Unsqueeze"
255
  ],
256
  "weight_type": "QUInt8"
257
  },
 
312
  "decoder_model_merged": {
313
  "op_types": [
314
  "Add",
315
+ "Cast",
316
  "Concat",
317
  "Constant",
318
  "ConstantOfShape",