Upload quantized ONNX weights
Browse files- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_quantized.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_quantized.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
- onnx/embed_tokens_bnb4.onnx +3 -0
- onnx/embed_tokens_fp16.onnx +3 -0
- onnx/embed_tokens_int8.onnx +3 -0
- onnx/embed_tokens_q4.onnx +3 -0
- onnx/embed_tokens_quantized.onnx +3 -0
- onnx/embed_tokens_uint8.onnx +3 -0
- onnx/encoder_model_bnb4.onnx +3 -0
- onnx/encoder_model_fp16.onnx +3 -0
- onnx/encoder_model_int8.onnx +3 -0
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_quantized.onnx +3 -0
- onnx/encoder_model_uint8.onnx +3 -0
- onnx/vision_encoder_bnb4.onnx +3 -0
- onnx/vision_encoder_fp16.onnx +3 -0
- onnx/vision_encoder_int8.onnx +3 -0
- onnx/vision_encoder_q4.onnx +3 -0
- onnx/vision_encoder_quantized.onnx +3 -0
- onnx/vision_encoder_uint8.onnx +3 -0
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5f2ebfd6b8b60103b3d60c05ea16e8b092d8f73cafb8478fb0f337c540d7c81
|
3 |
+
size 148757128
|
onnx/decoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79e188397967fc26466b9eabc619ff077c4d45b3e4e8ed2b0ea1006bf8e71db7
|
3 |
+
size 510975587
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab8f1745218d00effaa7ed60af0f08f9a95976fd310c6b2a5d84011e495180e1
|
3 |
+
size 256816021
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18d106d8731c7037a3e7fbfca5a7e0d980866d9f2d84cd67aaecf693355bfd04
|
3 |
+
size 149432159
|
onnx/decoder_model_merged_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87650fad8b38adcc8d668aa33cb6b4c9217abd959644caf29a799a1854cfcdad
|
3 |
+
size 511643557
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:167e7807fb1e5b8d693138f84bc81e1368ea11833264131c1ea96eafc9d13222
|
3 |
+
size 257619824
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:955d6e40a236d4c41237e3fe306c70c66b21cd0a392b976106420a16d42c378f
|
3 |
+
size 165295714
|
onnx/decoder_model_merged_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:167e7807fb1e5b8d693138f84bc81e1368ea11833264131c1ea96eafc9d13222
|
3 |
+
size 257619824
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:693fa1434e574c194d1fe950fd4967f39f4e8a73c6de54c48325c2261edb40be
|
3 |
+
size 257619762
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6e92df993c3563c60ae20aeab251a7318130ecead78fbeac67a40d3c591686
|
3 |
+
size 164621556
|
onnx/decoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab8f1745218d00effaa7ed60af0f08f9a95976fd310c6b2a5d84011e495180e1
|
3 |
+
size 256816021
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5287ce86f4660c2a2eb7fbe76b93f4ca3a356c4c7e395cfe4f972c11ef5587ba
|
3 |
+
size 256816076
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4d5767c113f78105d69c88efa8c4ceebf19d2e05c98efb6fab2799260d23a3d
|
3 |
+
size 134369341
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:509923999d3862e43aa5762677840ba6539719fdb9b6b317687a40d107399c55
|
3 |
+
size 460468797
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02a950da82a9dab1f9da784168ba519322b91effa4e84316eac341eff0ee5af3
|
3 |
+
size 231395095
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8511e6a4f3a554875c86b09558ae294641e76f4791206a3f4c151c3cc5bb5485
|
3 |
+
size 148661097
|
onnx/decoder_with_past_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02a950da82a9dab1f9da784168ba519322b91effa4e84316eac341eff0ee5af3
|
3 |
+
size 231395095
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6329230c18c61d77583dd6898494fc767b4c887e8478f35250540ef92e095012
|
3 |
+
size 231395139
|
onnx/embed_tokens_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503f1caa95e4d122addf94a34d5a7264aa9a9a45a56309fc13d956a016531670
|
3 |
+
size 210080062
|
onnx/embed_tokens_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abd6d8d3ea97655f601ea879aaa4f544a41d5ec567cf422184c4fa12654a14d8
|
3 |
+
size 105040321
|
onnx/embed_tokens_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dab1d09ab449f1302df6e439b35ec9e93fb037134bf6bed9ffeaa93a5b35d43c
|
3 |
+
size 52520480
|
onnx/embed_tokens_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503f1caa95e4d122addf94a34d5a7264aa9a9a45a56309fc13d956a016531670
|
3 |
+
size 210080062
|
onnx/embed_tokens_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dab1d09ab449f1302df6e439b35ec9e93fb037134bf6bed9ffeaa93a5b35d43c
|
3 |
+
size 52520480
|
onnx/embed_tokens_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75aff02b9806d35d7980f33bd6566c050f70c00d0e527d0ae11217084c95c9d8
|
3 |
+
size 52520479
|
onnx/encoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52044faeb83d833ccb29ea269237ec7705a79c98c5881e448c67346d1b8b14b2
|
3 |
+
size 90015331
|
onnx/encoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffec954badaf989519d38d07162d58024ec2ee1b0568f622d712bca75b4aebc9
|
3 |
+
size 304634480
|
onnx/encoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fe30b02cc8c2247631f8f0b9bc4d6613df1c33da0afe4087abff2f940bc2fe0
|
3 |
+
size 152985855
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f61c0650385c82f39573e86d0acf78b05f83d10c9acdbf775dbe342841b8a7e
|
3 |
+
size 99451927
|
onnx/encoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fe30b02cc8c2247631f8f0b9bc4d6613df1c33da0afe4087abff2f940bc2fe0
|
3 |
+
size 152985855
|
onnx/encoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c50292f74b78b4f2d4bfe589c79e51569ae2e093a45fadd5f3af780aca2b4f17
|
3 |
+
size 152985895
|
onnx/vision_encoder_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9b04507da17db548aa1b569e05331e5d749007b3e9967a75d4208a0f3d5574e
|
3 |
+
size 294675311
|
onnx/vision_encoder_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:157849cad88dd9517d5ba02c39ed7542636dbc82f94d98b3cef20331d3b6cc1f
|
3 |
+
size 727422819
|
onnx/vision_encoder_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f76d7178fd95412a438f9d682a36b84f243eec869afa1644e3efbb3b6e9cdfd
|
3 |
+
size 366371735
|
onnx/vision_encoder_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ad3644965e6253902fa0cc10d8e8af479326ea40add7d221c4d7fd191055dd
|
3 |
+
size 315744349
|
onnx/vision_encoder_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a197b359b7ed8269bcb001ab613800fc16f6f22da86fd77f2d16fa910da33f27
|
3 |
+
size 366371816
|
onnx/vision_encoder_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a197b359b7ed8269bcb001ab613800fc16f6f22da86fd77f2d16fa910da33f27
|
3 |
+
size 366371816
|