Upload optimized ONNX files w/ GQA
Browse files
onnx/decoder_model_merged_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91fe49a027c173c2ee620da92291c47cc559a283d642a792b75c1d055d2b042a
|
3 |
+
size 546702655
|
onnx/decoder_model_merged_q4f16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76bbee9e65863a1b393a1c406f132164d98aa58fcdc9c983f85b069c13c295f5
|
3 |
+
size 739917135
|