add files
Browse files- .gitignore +5 -0
- Makefile +47 -0
- README.md +14 -0
- SHA256SUMS +15 -0
- open-llama-7b-v2-f16.bin +3 -0
- open-llama-7b-v2-q2_K.bin +3 -0
- open-llama-7b-v2-q3_K_L.bin +3 -0
- open-llama-7b-v2-q3_K_M.bin +3 -0
- open-llama-7b-v2-q3_K_S.bin +3 -0
- open-llama-7b-v2-q4_0.bin +3 -0
- open-llama-7b-v2-q4_1.bin +3 -0
- open-llama-7b-v2-q4_K_M.bin +3 -0
- open-llama-7b-v2-q4_K_S.bin +3 -0
- open-llama-7b-v2-q5_0.bin +3 -0
- open-llama-7b-v2-q5_1.bin +3 -0
- open-llama-7b-v2-q5_K_M.bin +3 -0
- open-llama-7b-v2-q5_K_S.bin +3 -0
- open-llama-7b-v2-q6_K.bin +3 -0
- open-llama-7b-v2-q8_0.bin +3 -0
.gitignore
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
llama.cpp/
|
2 |
+
pytorch_model*.bin
|
3 |
+
*.sha
|
4 |
+
*.tar.gz
|
5 |
+
tokenizer.model
|
Makefile
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Build configuration.
#   MODEL_NAME  prefix of every generated model file ($(MODEL_NAME)-<quant>.bin)
#   PYTHON      interpreter used to run llama.cpp/convert.py; ?= lets the
#               environment or command line override it
#   LLAMA_TAG   llama.cpp revision; LLAMA_TAR is the tarball named after it
#   HF_REPO     Hugging Face repository the checkpoint is downloaded from
#   HF_REF      revision of that repository used in the download URL
MODEL_NAME= open-llama-7b-v2
|
2 |
+
PYTHON?= python
|
3 |
+
LLAMA_TAG= db4047a
|
4 |
+
LLAMA_TAR= master-$(LLAMA_TAG).tar.gz
|
5 |
+
HF_REPO= openlm-research/open_llama_7b_v2
|
6 |
+
HF_REF= main
|
7 |
+
# Files fetched from the Hugging Face repository; they are the prerequisites
# of the f16 conversion rule.
HF_FILES= pytorch_model-00001-of-00002.bin \
|
8 |
+
pytorch_model-00002-of-00002.bin \
|
9 |
+
tokenizer.model
|
10 |
+
# Target-specific base URLs: the shared download recipe appends /<target name>
# to SITE, so each group of files is fetched from its own origin.
$(HF_FILES): SITE= https://huggingface.co/$(HF_REPO)/resolve/$(HF_REF)
|
11 |
+
$(LLAMA_TAR): SITE= https://github.com/ggerganov/llama.cpp/archive/refs/tags
|
12 |
+
|
13 |
+
# Every file obtained by the download rule.
FILES= $(HF_FILES) $(LLAMA_TAR)
|
14 |
+
|
15 |
+
# Model variants to produce. Each word becomes $(MODEL_NAME)-<word>.bin, and
# the order here is the order of the entries written to SHA256SUMS.
QUANTS= f16 q4_0 q4_1 q5_0 q5_1 q8_0 \
|
16 |
+
q2_K \
|
17 |
+
q3_K_S q3_K_M q3_K_L \
|
18 |
+
q4_K_S q4_K_M \
|
19 |
+
q5_K_S q5_K_M \
|
20 |
+
q6_K
|
21 |
+
|
22 |
+
# Output file name for each entry of QUANTS: <MODEL_NAME>-<quant>.bin
MODEL_FILES= $(patsubst %,$(MODEL_NAME)-%.bin,$(QUANTS))
|
23 |
+
|
24 |
+
# Delete a target whose recipe exits non-zero, so a truncated model, checksum
# or download is never mistaken for an up-to-date file on the next run.
.DELETE_ON_ERROR:

# Default goal: build every model variant plus the combined checksum list.
.PHONY: all
|
25 |
+
all: $(MODEL_FILES) SHA256SUMS
|
26 |
+
|
27 |
+
# Download an upstream input from the per-target SITE base URL.
# --fail makes curl exit non-zero on an HTTP error (e.g. 404) instead of
# saving the server's error page as the target and reporting success.
$(FILES):
|
28 |
+
curl --fail -L -o $@ --url $(SITE)/$@
|
29 |
+
|
30 |
+
# Unpack the downloaded llama.cpp tarball into ./llama.cpp.
# --strip-components=1 drops the archive's top-level directory so the sources
# land directly inside the target directory.
llama.cpp: $(LLAMA_TAR)
|
31 |
+
mkdir -p $@
|
32 |
+
tar -xf $< --strip-components=1 -C $@
|
33 |
+
|
34 |
+
# Build the quantize tool inside the unpacked llama.cpp tree.
# The directory is an order-only prerequisite: it must exist first, but its
# timestamp (which changes whenever files are created inside it) must not make
# this rule look out of date on every run.
llama.cpp/quantize: | llama.cpp
|
35 |
+
$(MAKE) -C llama.cpp quantize
|
36 |
+
|
37 |
+
# Convert the downloaded checkpoint to the f16 model file with llama.cpp's
# convert.py; the trailing "." passes the current directory as its input.
# llama.cpp is order-only: it must be unpacked first, but its timestamp does
# not trigger a reconversion.
$(MODEL_NAME)-f16.bin: $(HF_FILES) | llama.cpp
|
38 |
+
$(PYTHON) llama.cpp/convert.py --outtype f16 --outfile $@ .
|
39 |
+
|
40 |
+
# Produce a quantized variant from the f16 model. The stem matched by % is
# re-prefixed with "q" and passed to quantize as its third argument.
# The quantize binary is order-only: it must exist, but rebuilding it does not
# invalidate existing quantized models.
$(MODEL_NAME)-q%.bin: $(MODEL_NAME)-f16.bin | llama.cpp/quantize
|
41 |
+
llama.cpp/quantize $< $@ q$*
|
42 |
+
|
43 |
+
# Write the sha256sum output line for any file to <file>.sha.
%.sha: %
|
44 |
+
sha256sum $< > $@
|
45 |
+
|
46 |
+
# Combined checksum list: the per-model .sha files concatenated in
# MODEL_FILES order.
SHA256SUMS: $(MODEL_FILES:%=%.sha)
|
47 |
+
cat $^ >$@
|
README.md
CHANGED
@@ -1,3 +1,17 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
4 |
+
|
5 |
+
# ggml versions of OpenLLaMA 7B v2
|
6 |
+
|
7 |
+
For use with [llama.cpp](https://github.com/ggerganov/llama.cpp).
|
8 |
+
|
9 |
+
- Version: [Final version](https://github.com/openlm-research/open_llama#update-07072023)
|
10 |
+
- Project: [OpenLLaMA: An Open Reproduction of LLaMA](https://github.com/openlm-research/open_llama)
|
11 |
+
- Model: [openlm-research/open_llama_7b_v2](https://huggingface.co/openlm-research/open_llama_7b_v2)
|
12 |
+
- llama.cpp 4-, 5-, and 8-bit quantization: build 567(2d5db48) or later
|
13 |
+
- llama.cpp newer quantization formats: build 616(99009e7) or later
|
14 |
+
|
15 |
+
## Perplexity
|
16 |
+
|
17 |
+
Coming soon...
|
SHA256SUMS
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
e8638da6ae24ead336d7cf11ca822cbc2758ee6eba696259d7f44aacacdae28e open-llama-7b-v2-f16.bin
|
2 |
+
d70bb8fe5eefd194f55cc8dfd9277b57a20d611252d61c7aa2bee18cc9aae44f open-llama-7b-v2-q4_0.bin
|
3 |
+
a7bd7f6d19818ef85f81999965e9706974cfc5c3d2196b407fc1053bc1f0f71a open-llama-7b-v2-q4_1.bin
|
4 |
+
f753d0c9a8d28f4643452d5cb882376f62be295ab88fe41904373c77ec631b0a open-llama-7b-v2-q5_0.bin
|
5 |
+
09cb091143a3cdc70bfa956b49708f3e2b23d286a376b20cce90425f9ea33075 open-llama-7b-v2-q5_1.bin
|
6 |
+
f2e016738892ac755a6bde4a8df435cc574edc26f4023bc6c5d9f865bae30624 open-llama-7b-v2-q8_0.bin
|
7 |
+
af3221bab03e6f8c321d28ac473863b12d6731f29c953f2e529681bdff259718 open-llama-7b-v2-q2_K.bin
|
8 |
+
f6039a48a5763d03c34d7f9f3516e49d44d55364a602944e365d924d280c28c7 open-llama-7b-v2-q3_K_S.bin
|
9 |
+
8dca03aaf8aabaf2e10e6bd02ea33f3909e863d0f0e25e78af7a1ca23b743778 open-llama-7b-v2-q3_K_M.bin
|
10 |
+
b74ce0b75e71a782a947309839cf8a4b989eb9572a352cd9c0c45b5cd62e0a1a open-llama-7b-v2-q3_K_L.bin
|
11 |
+
5de4cd3b6c44bd667324125b5163beed6a9b264360104e6bb0fb39c2538512a8 open-llama-7b-v2-q4_K_S.bin
|
12 |
+
47903d1ce81eca3cd5f985ae5cae82769421d8a687287c8a8471abf9d186214f open-llama-7b-v2-q4_K_M.bin
|
13 |
+
38a4148fad35971d41df5a63d34fb8b538c0f5613736a3a732e36e0a4c1c3cf9 open-llama-7b-v2-q5_K_S.bin
|
14 |
+
993894f8eb588882e1d63b2d1bd285b9d788cd297f2a491dfd62e482da354c08 open-llama-7b-v2-q5_K_M.bin
|
15 |
+
a0be750e3702142b62629e1c7e79c625b1cbf76de1ded8bac1b8bba2e4a23826 open-llama-7b-v2-q6_K.bin
|
open-llama-7b-v2-f16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8638da6ae24ead336d7cf11ca822cbc2758ee6eba696259d7f44aacacdae28e
|
3 |
+
size 13477822624
|
open-llama-7b-v2-q2_K.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af3221bab03e6f8c321d28ac473863b12d6731f29c953f2e529681bdff259718
|
3 |
+
size 2866815136
|
open-llama-7b-v2-q3_K_L.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74ce0b75e71a782a947309839cf8a4b989eb9572a352cd9c0c45b5cd62e0a1a
|
3 |
+
size 3596828832
|
open-llama-7b-v2-q3_K_M.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dca03aaf8aabaf2e10e6bd02ea33f3909e863d0f0e25e78af7a1ca23b743778
|
3 |
+
size 3282256032
|
open-llama-7b-v2-q3_K_S.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6039a48a5763d03c34d7f9f3516e49d44d55364a602944e365d924d280c28c7
|
3 |
+
size 2948022432
|
open-llama-7b-v2-q4_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d70bb8fe5eefd194f55cc8dfd9277b57a20d611252d61c7aa2bee18cc9aae44f
|
3 |
+
size 3825524896
|
open-llama-7b-v2-q4_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7bd7f6d19818ef85f81999965e9706974cfc5c3d2196b407fc1053bc1f0f71a
|
3 |
+
size 4238467232
|
open-llama-7b-v2-q4_K_M.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47903d1ce81eca3cd5f985ae5cae82769421d8a687287c8a8471abf9d186214f
|
3 |
+
size 4080722080
|
open-llama-7b-v2-q4_K_S.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5de4cd3b6c44bd667324125b5163beed6a9b264360104e6bb0fb39c2538512a8
|
3 |
+
size 3825524896
|
open-llama-7b-v2-q5_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f753d0c9a8d28f4643452d5cb882376f62be295ab88fe41904373c77ec631b0a
|
3 |
+
size 4651409568
|
open-llama-7b-v2-q5_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09cb091143a3cdc70bfa956b49708f3e2b23d286a376b20cce90425f9ea33075
|
3 |
+
size 5064351904
|
open-llama-7b-v2-q5_K_M.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:993894f8eb588882e1d63b2d1bd285b9d788cd297f2a491dfd62e482da354c08
|
3 |
+
size 4782874784
|
open-llama-7b-v2-q5_K_S.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38a4148fad35971d41df5a63d34fb8b538c0f5613736a3a732e36e0a4c1c3cf9
|
3 |
+
size 4651409568
|
open-llama-7b-v2-q6_K.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0be750e3702142b62629e1c7e79c625b1cbf76de1ded8bac1b8bba2e4a23826
|
3 |
+
size 5528912032
|
open-llama-7b-v2-q8_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2e016738892ac755a6bde4a8df435cc574edc26f4023bc6c5d9f865bae30624
|
3 |
+
size 7129063584
|