Spaces: Runtime error
rms_norm_eps 1e-5 for best generation quality
Browse files
app.py
CHANGED
@@ -11,7 +11,7 @@ from llama_cpp import LlamaRAMCache
 
 hf_hub_download(repo_id="TheBloke/Llama-2-7B-chat-GGML", filename="llama-2-7b-chat.ggmlv3.q4_K_M.bin", local_dir=".")
 
-llm = Llama(model_path="./llama-2-7b-chat.ggmlv3.q4_K_M.bin")
+llm = Llama(model_path="./llama-2-7b-chat.ggmlv3.q4_K_M.bin", rms_norm_eps=1e-5)
 
 cache = LlamaRAMCache(capacity_bytes=2 << 30)
 