Update app.py
Browse files
app.py
CHANGED
@@ -451,7 +451,7 @@ llm = Llama(
|
|
451 |
model_path=true_path, # Download the model file first
|
452 |
n_ctx=8000, # The max sequence length to use - note that longer sequence lengths require much more resources
|
453 |
n_threads=8, # The number of CPU threads to use, tailor to your system and the resulting performance
|
454 |
-
n_gpu_layers=-1, # The number of layers to offload to GPU, if you have GPU acceleration available
|
455 |
chat_format="llama-2"
|
456 |
)
|
457 |
|
|
|
451 |
model_path=true_path, # Download the model file first
|
452 |
n_ctx=8000, # The max sequence length to use - note that longer sequence lengths require much more resources
|
453 |
n_threads=8, # The number of CPU threads to use, tailor to your system and the resulting performance
|
454 |
+
# n_gpu_layers=-1, # Disabled: GPU offload is turned off (CPU-only inference); re-enable to offload all layers to the GPU if you have GPU acceleration available
|
455 |
chat_format="llama-2"
|
456 |
)
|
457 |
|