SlyEcho committed on
Commit
e0a9bc8
1 Parent(s): 847ed16
.gitignore ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ llama.cpp/
2
+ pytorch_model*.bin
3
+ *.sha
4
+ *.tar.gz
5
+ tokenizer.model
Makefile ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MODEL_NAME= open-llama-7b-v2
2
+ PYTHON?= python
3
+ LLAMA_TAG= db4047a
4
+ LLAMA_TAR= master-$(LLAMA_TAG).tar.gz
5
+ HF_REPO= openlm-research/open_llama_7b_v2
6
+ HF_REF= main
7
+ HF_FILES= pytorch_model-00001-of-00002.bin \
8
+ pytorch_model-00002-of-00002.bin \
9
+ tokenizer.model
10
+ $(HF_FILES): SITE= https://huggingface.co/$(HF_REPO)/resolve/$(HF_REF)
11
+ $(LLAMA_TAR): SITE= https://github.com/ggerganov/llama.cpp/archive/refs/tags
12
+
13
+ FILES= $(HF_FILES) $(LLAMA_TAR)
14
+
15
+ QUANTS= f16 q4_0 q4_1 q5_0 q5_1 q8_0 \
16
+ q2_K \
17
+ q3_K_S q3_K_M q3_K_L \
18
+ q4_K_S q4_K_M \
19
+ q5_K_S q5_K_M \
20
+ q6_K
21
+
22
+ MODEL_FILES= $(addsuffix .bin,$(addprefix $(MODEL_NAME)-,$(QUANTS)))
23
+
24
+ .PHONY: all
25
+ all: $(MODEL_FILES) SHA256SUMS
26
+
27
+ $(FILES):
28
+ curl -L -o $@ --url $(SITE)/$@
29
+
30
+ llama.cpp: $(LLAMA_TAR)
31
+ mkdir -p $@
32
+ tar -xf $< --strip-components=1 -C $@
33
+
34
+ llama.cpp/quantize: llama.cpp
35
+ $(MAKE) -C llama.cpp quantize
36
+
37
+ $(MODEL_NAME)-f16.bin: $(HF_FILES) | llama.cpp
38
+ $(PYTHON) llama.cpp/convert.py --outtype f16 --outfile $@ .
39
+
40
+ $(MODEL_NAME)-q%.bin: $(MODEL_NAME)-f16.bin | llama.cpp/quantize
41
+ llama.cpp/quantize $< $@ q$*
42
+
43
+ %.sha: %
44
+ sha256sum $< > $@
45
+
46
+ SHA256SUMS: $(addsuffix .sha,$(MODEL_FILES))
47
+ cat $^ > $@
README.md CHANGED
@@ -1,3 +1,17 @@
1
  ---
2
  license: apache-2.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: apache-2.0
3
  ---
4
+
5
+ # ggml versions of OpenLLaMA 7B v2
6
+
7
+ For use with [llama.cpp](https://github.com/ggerganov/llama.cpp).
8
+
9
+ - Version: [Final version](https://github.com/openlm-research/open_llama#update-07072023)
10
+ - Project: [OpenLLaMA: An Open Reproduction of LLaMA](https://github.com/openlm-research/open_llama)
11
+ - Model: [openlm-research/open_llama_7b_v2](https://huggingface.co/openlm-research/open_llama_7b_v2)
12
+ - llama.cpp 4-, 5-, and 8-bit quantization: build 567 (2d5db48) or later
13
+ - llama.cpp newer quantization formats: build 616 (99009e7) or later
14
+
15
+ ## Perplexity
16
+
17
+ Coming soon...
SHA256SUMS ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ e8638da6ae24ead336d7cf11ca822cbc2758ee6eba696259d7f44aacacdae28e open-llama-7b-v2-f16.bin
2
+ d70bb8fe5eefd194f55cc8dfd9277b57a20d611252d61c7aa2bee18cc9aae44f open-llama-7b-v2-q4_0.bin
3
+ a7bd7f6d19818ef85f81999965e9706974cfc5c3d2196b407fc1053bc1f0f71a open-llama-7b-v2-q4_1.bin
4
+ f753d0c9a8d28f4643452d5cb882376f62be295ab88fe41904373c77ec631b0a open-llama-7b-v2-q5_0.bin
5
+ 09cb091143a3cdc70bfa956b49708f3e2b23d286a376b20cce90425f9ea33075 open-llama-7b-v2-q5_1.bin
6
+ f2e016738892ac755a6bde4a8df435cc574edc26f4023bc6c5d9f865bae30624 open-llama-7b-v2-q8_0.bin
7
+ af3221bab03e6f8c321d28ac473863b12d6731f29c953f2e529681bdff259718 open-llama-7b-v2-q2_K.bin
8
+ f6039a48a5763d03c34d7f9f3516e49d44d55364a602944e365d924d280c28c7 open-llama-7b-v2-q3_K_S.bin
9
+ 8dca03aaf8aabaf2e10e6bd02ea33f3909e863d0f0e25e78af7a1ca23b743778 open-llama-7b-v2-q3_K_M.bin
10
+ b74ce0b75e71a782a947309839cf8a4b989eb9572a352cd9c0c45b5cd62e0a1a open-llama-7b-v2-q3_K_L.bin
11
+ 5de4cd3b6c44bd667324125b5163beed6a9b264360104e6bb0fb39c2538512a8 open-llama-7b-v2-q4_K_S.bin
12
+ 47903d1ce81eca3cd5f985ae5cae82769421d8a687287c8a8471abf9d186214f open-llama-7b-v2-q4_K_M.bin
13
+ 38a4148fad35971d41df5a63d34fb8b538c0f5613736a3a732e36e0a4c1c3cf9 open-llama-7b-v2-q5_K_S.bin
14
+ 993894f8eb588882e1d63b2d1bd285b9d788cd297f2a491dfd62e482da354c08 open-llama-7b-v2-q5_K_M.bin
15
+ a0be750e3702142b62629e1c7e79c625b1cbf76de1ded8bac1b8bba2e4a23826 open-llama-7b-v2-q6_K.bin
open-llama-7b-v2-f16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8638da6ae24ead336d7cf11ca822cbc2758ee6eba696259d7f44aacacdae28e
3
+ size 13477822624
open-llama-7b-v2-q2_K.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af3221bab03e6f8c321d28ac473863b12d6731f29c953f2e529681bdff259718
3
+ size 2866815136
open-llama-7b-v2-q3_K_L.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74ce0b75e71a782a947309839cf8a4b989eb9572a352cd9c0c45b5cd62e0a1a
3
+ size 3596828832
open-llama-7b-v2-q3_K_M.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dca03aaf8aabaf2e10e6bd02ea33f3909e863d0f0e25e78af7a1ca23b743778
3
+ size 3282256032
open-llama-7b-v2-q3_K_S.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6039a48a5763d03c34d7f9f3516e49d44d55364a602944e365d924d280c28c7
3
+ size 2948022432
open-llama-7b-v2-q4_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d70bb8fe5eefd194f55cc8dfd9277b57a20d611252d61c7aa2bee18cc9aae44f
3
+ size 3825524896
open-llama-7b-v2-q4_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7bd7f6d19818ef85f81999965e9706974cfc5c3d2196b407fc1053bc1f0f71a
3
+ size 4238467232
open-llama-7b-v2-q4_K_M.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47903d1ce81eca3cd5f985ae5cae82769421d8a687287c8a8471abf9d186214f
3
+ size 4080722080
open-llama-7b-v2-q4_K_S.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de4cd3b6c44bd667324125b5163beed6a9b264360104e6bb0fb39c2538512a8
3
+ size 3825524896
open-llama-7b-v2-q5_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f753d0c9a8d28f4643452d5cb882376f62be295ab88fe41904373c77ec631b0a
3
+ size 4651409568
open-llama-7b-v2-q5_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09cb091143a3cdc70bfa956b49708f3e2b23d286a376b20cce90425f9ea33075
3
+ size 5064351904
open-llama-7b-v2-q5_K_M.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:993894f8eb588882e1d63b2d1bd285b9d788cd297f2a491dfd62e482da354c08
3
+ size 4782874784
open-llama-7b-v2-q5_K_S.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a4148fad35971d41df5a63d34fb8b538c0f5613736a3a732e36e0a4c1c3cf9
3
+ size 4651409568
open-llama-7b-v2-q6_K.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0be750e3702142b62629e1c7e79c625b1cbf76de1ded8bac1b8bba2e4a23826
3
+ size 5528912032
open-llama-7b-v2-q8_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2e016738892ac755a6bde4a8df435cc574edc26f4023bc6c5d9f865bae30624
3
+ size 7129063584