Upload q4f16 ONNX weights
Browse files
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ceef792245e41918dd2fb0aa7b2a6fb4302bec8c7341cf089a4d3ecbc6d5915d
|
3 |
+
size 146770498
|
onnx/decoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8145a13ee4d40712949a5202f63af0d9298f34c9db5b917b25be0be2f95967c
|
3 |
+
size 146089194
|
onnx/decoder_with_past_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2461161368e8eaed4809c7d0c443480250d5f2d058b83af38877bdf8993e9c44
|
3 |
+
size 131753895
|
onnx/embed_tokens_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3677413496147237becbe39cbdb6010f5f6d6ad5f0a0bd3da0746405d2d0301e
|
3 |
+
size 105040340
|
onnx/encoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15deb88e3850d01e3a5ff2056c503426bbeb1adf6aa9a7cd9315153ac239cd09
|
3 |
+
size 87590004
|
onnx/vision_encoder_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aa74cef10bfe9caeef7d1f8420356f9120f75354348ab2f5292004813662d09
|
3 |
+
size 242831340
|