AaronHuangWei
committed on
Commit
•
2e82767
1
Parent(s):
87f6ff2
add group precision for some small LLMs
Browse files
- block_precision_128_2bit/Llama-2-13b-hf.pt +3 -0
- block_precision_128_2bit/Llama-2-7b-hf.pt +3 -0
- block_precision_128_2bit/Meta-Llama-3-8B.pt +3 -0
- block_precision_128_2bit/llama-13b.pt +3 -0
- block_precision_128_2bit/llama-30b.pt +3 -0
- block_precision_128_2bit/llama-7b.pt +3 -0
- block_precision_128_2bit/opt-1.3b.pt +3 -0
- block_precision_128_2bit/opt-13b.pt +3 -0
- block_precision_128_2bit/opt-2.7b.pt +3 -0
- block_precision_128_2bit/opt-30b.pt +3 -0
- block_precision_128_2bit/opt-6.7b.pt +3 -0
- block_precision_128_3bit/Llama-2-13b-hf.pt +3 -0
- block_precision_128_3bit/Llama-2-7b-hf.pt +3 -0
- block_precision_128_3bit/Meta-Llama-3-8B.pt +3 -0
- block_precision_128_3bit/llama-13b.pt +3 -0
- block_precision_128_3bit/llama-30b.pt +3 -0
- block_precision_128_3bit/llama-7b.pt +3 -0
- block_precision_128_3bit/opt-1.3b.pt +3 -0
- block_precision_128_3bit/opt-13b.pt +3 -0
- block_precision_128_3bit/opt-2.7b.pt +3 -0
- block_precision_128_3bit/opt-30b.pt +3 -0
- block_precision_128_3bit/opt-6.7b.pt +3 -0
- block_precision_256_3bit/Llama-2-7b-hf.pt +3 -0
- block_precision_256_3bit/Meta-Llama-3-8B.pt +3 -0
- block_precision_256_3bit/llama-7b.pt +3 -0
- block_precision_256_3bit/opt-6.7b.pt +3 -0
- block_precision_64_2bit/Meta-Llama-3-8B.pt +3 -0
- block_precision_64_2bit/llama-13b.pt +3 -0
- block_precision_64_2bit/opt-1.3b.pt +3 -0
- block_precision_64_2bit/opt-13b.pt +3 -0
- block_precision_64_2bit/opt-2.7b.pt +3 -0
- block_precision_64_2bit/opt-6.7b.pt +3 -0
block_precision_128_2bit/Llama-2-13b-hf.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50ace2723eab72b3dc93d25ec5e7690a94915fde303500af09c3ef596d6aa9e7
|
3 |
+
size 37436
|
block_precision_128_2bit/Llama-2-7b-hf.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74d427e59926a19ac81cac73ca7fd3e9b61d148fd6e4d7e8c74f47425a3e3763
|
3 |
+
size 25464
|
block_precision_128_2bit/Meta-Llama-3-8B.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2a2637031f304fa9c9bcdbd0dc1b88ed39917cd54a82d7e0ecf871d52fea4e5
|
3 |
+
size 27136
|
block_precision_128_2bit/llama-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c625461f062e95aad45f7ef26b87938f4708dfd6fd74cc7b20cce32f86de5a47
|
3 |
+
size 37416
|
block_precision_128_2bit/llama-30b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cd989ba0056baa39b30f10b03d9a146e4ff881762573841d0ca82175b5fc370
|
3 |
+
size 68520
|
block_precision_128_2bit/llama-7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1bb27058b1c5e3fb361493353ac25248b967f74a6455424fbc78a355d2ec7bf
|
3 |
+
size 25444
|
block_precision_128_2bit/opt-1.3b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13f27358ee34fc1609e81a7adef62ba3feba53c65cc9fdde6fee4e4f9380a424
|
3 |
+
size 11044
|
block_precision_128_2bit/opt-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2797b1f926b22090f95107219ce19f5a22ee99e751779dfa850301a6313354e
|
3 |
+
size 35616
|
block_precision_128_2bit/opt-2.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:743bd595c7c18dff043c4bb68aa7fe8af28166ea4bcaec4a5911d64b2c29fef8
|
3 |
+
size 16996
|
block_precision_128_2bit/opt-30b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb04a39aaa61f0322e94d28fef9e92062062cb0f74045ccd42ef4d94d107acf
|
3 |
+
size 56544
|
block_precision_128_2bit/opt-6.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6792687975832480810d011fa33b6c2be56aeff82bdc460de9128b1793f131b3
|
3 |
+
size 23908
|
block_precision_128_3bit/Llama-2-13b-hf.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd481b8462d35e0ed8755bb277ebc852075801740f5ad37cdaebd93f7c5382e7
|
3 |
+
size 37436
|
block_precision_128_3bit/Llama-2-7b-hf.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09f3f2fd6fcc9b92a801a3dc6b8f75c0ad5b087bb9c4131b120b85c3bce684a
|
3 |
+
size 25464
|
block_precision_128_3bit/Meta-Llama-3-8B.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:771f30bf69190eff3c49b1b9a643a33f1a3525317ff1d7d2f6c67ecb99e58a0d
|
3 |
+
size 27136
|
block_precision_128_3bit/llama-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e25d6c5d41d50e5c30731c206101547a1426b7bdf3ed184409ee8a755e078061
|
3 |
+
size 37416
|
block_precision_128_3bit/llama-30b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:528d7085dbf55ad70f433d47e72415074d7b28dd9b0cee08b4d64e0e1e316ad4
|
3 |
+
size 68520
|
block_precision_128_3bit/llama-7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f6ce57ad9805a18d665f24d596f1a2ce942f040f098b999313484550a0e88c
|
3 |
+
size 25444
|
block_precision_128_3bit/opt-1.3b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c87616e75b42d5bb3663b772ec1e3938411b228e2dce751a6cfe05a65a16bb00
|
3 |
+
size 11044
|
block_precision_128_3bit/opt-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b139a7dd7f6249f6471f5114d0fdaf8c69e8313f462f3cc732420113e9ce8f5
|
3 |
+
size 35616
|
block_precision_128_3bit/opt-2.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ec8815cf7c18d64af051bf53ddae37f299d66bed85b8954632ec90c5484cd92
|
3 |
+
size 16996
|
block_precision_128_3bit/opt-30b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d51a7dccbf8b8b12ab6f6969dc8a8956e7dde417798b83d1448a023b78c18dcb
|
3 |
+
size 56544
|
block_precision_128_3bit/opt-6.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d912b12a73c664d11bf1dfc08b42db1d2c81e342c0a6698c65e7e87889189b47
|
3 |
+
size 23908
|
block_precision_256_3bit/Llama-2-7b-hf.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b98a948ff7005135a97a99f7db904aee57cfaf38f20f26efe5fc4311761caf4
|
3 |
+
size 16568
|
block_precision_256_3bit/Meta-Llama-3-8B.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8923fb47e87971b8a4a36225f742beae39f38278fc84a0da5c25ad2acdff598
|
3 |
+
size 17408
|
block_precision_256_3bit/llama-7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a4df4de9cc497c4f151720754b91417fe769a42e33a253ce0a4a80d3610fd06
|
3 |
+
size 16548
|
block_precision_256_3bit/opt-6.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be20d3499f001c3de9ba7bf4b460168c23af140941d093f193f61fb21ea24288
|
3 |
+
size 14692
|
block_precision_64_2bit/Meta-Llama-3-8B.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3a52d946f8e72b893e72b80066c547144445fff3161e07552bc5f86e3ecb30
|
3 |
+
size 46592
|
block_precision_64_2bit/llama-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbad18ce48537e48d17758252ba04c0e3ab46e6bf96cde6723acd14b75993c3b
|
3 |
+
size 65256
|
block_precision_64_2bit/opt-1.3b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b458688bf5e862a0afd9af5882098045c2b5c1e65a1639ae6dad52a60a2c2e2c
|
3 |
+
size 17956
|
block_precision_64_2bit/opt-13b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f362d2dc57e3cf1aef0141dd5d1d7f5bfc0430efe52e29d3bbf0ce294c735138
|
3 |
+
size 64416
|
block_precision_64_2bit/opt-2.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b17baae81f4bae088ff7cfc8d5f074299b89388a48798720e320b781eb8a21
|
3 |
+
size 28516
|
block_precision_64_2bit/opt-6.7b.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e7c846fad90ce08db87e0518cce83c7999b0be906e9c69f32af194ac3dbdbd6
|
3 |
+
size 42340
|