Update README.md
Browse files
README.md
CHANGED
@@ -25,6 +25,7 @@ llm = Llama.from_pretrained(
|
|
25 |
repo_id="abetlen/paligemma-3b-mix-224-gguf",
|
26 |
filename="*text-model-q4_k_m.gguf",
|
27 |
chat_handler=chat_handler,
|
|
|
28 |
n_ctx=2048, # n_ctx should be increased to accommodate the image embedding
|
29 |
n_ubatch=512, # must be large enough to fit image embeddings and text input in a single batch
|
30 |
n_batch=512
|
|
|
25 |
repo_id="abetlen/paligemma-3b-mix-224-gguf",
|
26 |
filename="*text-model-q4_k_m.gguf",
|
27 |
chat_handler=chat_handler,
|
28 |
+
n_gpu_layers=-1,
|
29 |
n_ctx=2048, # n_ctx should be increased to accommodate the image embedding
|
30 |
n_ubatch=512, # must be large enough to fit image embeddings and text input in a single batch
|
31 |
n_batch=512
|