Xenova HF staff committed on
Commit
33593c6
1 Parent(s): 1db03f4

Upload quantized ONNX weights (#1)

Browse files

- Upload quantized ONNX weights (8269fb6446908654d8926eb386520ad337d3d516)

onnx/decoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0b9cfbee73984dfc10833ef5be99a6485f15ecac770f119997b98c75da39ed
3
+ size 148757128
onnx/decoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059a04344350e80eec87b7a360f77d6d9de27817ebd7ed109f004469b043151f
3
+ size 510975587
onnx/decoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f0f6cd83c057df5da5a0586d3c5483d9135d17537ec876bb8e8ebbf42627f7e
3
+ size 256816021
onnx/decoder_model_merged_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e701c77fc34737334ed853c07365b2329fe7a2b6a80388b51158e7471e38f0
3
+ size 149432159
onnx/decoder_model_merged_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f007b050621cd1b60392f25a4fe837fb2eda425c11580edd376acc77a369b9b
3
+ size 511643557
onnx/decoder_model_merged_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a87417445e9ecbf0adb68ac0c2c86a7a05f7415b41a45404152528c2dc5d494
3
+ size 257619797
onnx/decoder_model_merged_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d13b29ac7da5a998c73d9d8bf9e9380425dc5d03398a82507831651e1a47a374
3
+ size 165295714
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a87417445e9ecbf0adb68ac0c2c86a7a05f7415b41a45404152528c2dc5d494
3
+ size 257619797
onnx/decoder_model_merged_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68d47062b82f1ae06eeab32445b25b77c07fc4ee97ae636b7fba6185044df6ea
3
+ size 257619768
onnx/decoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83cb8cead83f91d5c5e4c1ac6a3e20073f96cc9512a6a032c70c2eb704dc21e0
3
+ size 164621556
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f0f6cd83c057df5da5a0586d3c5483d9135d17537ec876bb8e8ebbf42627f7e
3
+ size 256816021
onnx/decoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70eed266a19fd4e2d981209232da882431bc2b378cea0921d8db1ac821a53d55
3
+ size 256816082
onnx/decoder_with_past_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c8c17a4be4f6ebb98907194424c77733427441c120065fd4e0ca564a2126be0
3
+ size 134368512
onnx/decoder_with_past_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7675346298bd4d5a2c3951346e4aa896c2f5f84d28d07fab261291f20d444505
3
+ size 460467968
onnx/decoder_with_past_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:269740e47586ab594ba6e5f36b3582e18394fde8b04846bd2e6a3bc4be21d2dd
3
+ size 231394266
onnx/decoder_with_past_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a39fca9b7151371ba1f8f78f6e531abfd1cbf9521d5f9597027185ade16ea57
3
+ size 148660268
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:269740e47586ab594ba6e5f36b3582e18394fde8b04846bd2e6a3bc4be21d2dd
3
+ size 231394266
onnx/decoder_with_past_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537ce27eb955ec77e1ca54476a75c3fd82c602dcc52d554aeffc78a6e03b3e24
3
+ size 231394313
onnx/embed_tokens_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2d2d452503b2c75683f21e96659a13b3c3da1561ca59a5294ee35f9f49b78c
3
+ size 210080062
onnx/embed_tokens_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:661859f77f1b3f9d2bcdd8eb4fc6e611f48c51abdc55af67de1aa2e0e466ccda
3
+ size 105040321
onnx/embed_tokens_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f64649977559f0f88c5beed562d1f4c1f946f4831d17afe433f2d76a7da2fb6
3
+ size 52520480
onnx/embed_tokens_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2d2d452503b2c75683f21e96659a13b3c3da1561ca59a5294ee35f9f49b78c
3
+ size 210080062
onnx/embed_tokens_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f64649977559f0f88c5beed562d1f4c1f946f4831d17afe433f2d76a7da2fb6
3
+ size 52520480
onnx/embed_tokens_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70516a87d14ce774a15ca5ec0d8c2bc58c44552959e372196b741bfaa1c3eb70
3
+ size 52520479
onnx/encoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a71f51c0be8ff2de5bdb19e1c76344d2657c9cc3e0fd29c7280feb7ace1df8
3
+ size 90015331
onnx/encoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53211b7c6fd8dc63422d7423fe637fc7debea665996c08a31352943c2e96b231
3
+ size 304634480
onnx/encoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f49539850b62d21b80f1d0950359aa6b5e6801378fa8aa968a5eaf2f449448
3
+ size 152985855
onnx/encoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3fdccdbab224adcfbf3c5df7a95ea89cdffc7e917bac9f8a7879b94560c1f0
3
+ size 99451927
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f49539850b62d21b80f1d0950359aa6b5e6801378fa8aa968a5eaf2f449448
3
+ size 152985855
onnx/encoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eb30cf8a1ff4af6e79b9858494331a122ac919f7b430bbe41c7f6e22d75d8a2
3
+ size 152985897
onnx/vision_encoder_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3e8e06be761ac08da0fb35f8cf3f2ebea3e9f2cb4a8cc08caefd2119e02fbc8
3
+ size 294675311
onnx/vision_encoder_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e5a26503ed487facd4459cfac85513b6c917dabd021c5ed141f283a0c7e8514
3
+ size 727422819
onnx/vision_encoder_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba1f4c8ca1fcfb0007defae0827a2528f388af79b9f000881d573796af40bb80
3
+ size 366371735
onnx/vision_encoder_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd2949cc69b4ffaaa135e813a0ede5f864a3084322565fafec95eaf17bd304e9
3
+ size 315744349
onnx/vision_encoder_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74aa56d21ce306d559bb8ddef99cf04915c14fd9aa0452f9e39914d5a859fb4e
3
+ size 366371812
onnx/vision_encoder_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74aa56d21ce306d559bb8ddef99cf04915c14fd9aa0452f9e39914d5a859fb4e
3
+ size 366371812