abetlen committed on
Commit
17f3ac9
1 Parent(s): b3ab4c2

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -0
README.md CHANGED
@@ -25,6 +25,7 @@ llm = Llama.from_pretrained(
25
  repo_id="abetlen/paligemma-3b-mix-224-gguf",
26
  filename="*text-model-q4_k_m.gguf",
27
  chat_handler=chat_handler,
 
28
  n_ctx=2048, # n_ctx should be increased to accommodate the image embedding
29
  n_ubatch=512, # must be large enough to fit image embeddings and text input in a single batch
30
  n_batch=512
 
25
  repo_id="abetlen/paligemma-3b-mix-224-gguf",
26
  filename="*text-model-q4_k_m.gguf",
27
  chat_handler=chat_handler,
28
+ n_gpu_layers=-1,
29
  n_ctx=2048, # n_ctx should be increased to accommodate the image embedding
30
  n_ubatch=512, # must be large enough to fit image embeddings and text input in a single batch
31
  n_batch=512