Update README.md
Browse files
README.md
CHANGED
@@ -58,8 +58,8 @@ from huggingface_hub import hf_hub_download
|
|
58 |
from llama_cpp import Llama
|
59 |
|
60 |
model_path = hf_hub_download(
|
61 |
-
repo_id="MoxoffSpA/
|
62 |
-
filename="
|
63 |
)
|
64 |
|
65 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|
|
|
58 |
from llama_cpp import Llama
|
59 |
|
60 |
model_path = hf_hub_download(
|
61 |
+
repo_id="MoxoffSpA/VolareQuantized",
|
62 |
+
filename="Volare-ggml-Q4_K_M.gguf"
|
63 |
)
|
64 |
|
65 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|