MoxoffSrL
/

VolareQuantized

Text Generation

Inference Endpoints

Model card · Files and versions · Community

marcodambra committed on Apr 16, 2024

Commit

2ec4a6e

·

verified ·

1 Parent(s): 6b2d485

Update README.md

Files changed (1) hide show

README.md +2 -2

README.md CHANGED Viewed

@@ -58,8 +58,8 @@ from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
 model_path = hf_hub_download(
-    repo_id="MoxoffSpA/AzzurroQuantized",
-    filename="Azzurro-ggml-Q4_K_M.gguf"
 )
 # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.

 from llama_cpp import Llama
 model_path = hf_hub_download(
+    repo_id="MoxoffSpA/VolareQuantized",
+    filename="Volare-ggml-Q4_K_M.gguf"
 )
 # Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.