Update app.py
Browse files
app.py
CHANGED
|
@@ -23,8 +23,10 @@ print(f"Model downloaded to: {model_path}")
|
|
| 23 |
|
| 24 |
llm = Llama(
|
| 25 |
model_path=model_path,
|
|
|
|
|
|
|
| 26 |
n_gpu_layers=0, # CPU only: 0 layers are offloaded to the GPU (-1 would offload all layers)
|
| 27 |
-
n_ctx=
|
| 28 |
chat_format="llama-3",
|
| 29 |
)
|
| 30 |
|
|
|
|
| 23 |
|
| 24 |
llm = Llama(
|
| 25 |
model_path=model_path,
|
| 26 |
+
n_threads=2,
|
| 27 |
+
n_batch=256,
|
| 28 |
n_gpu_layers=0, # CPU only: 0 layers are offloaded to the GPU (-1 would offload all layers)
|
| 29 |
+
n_ctx=2048,
|
| 30 |
chat_format="llama-3",
|
| 31 |
)
|
| 32 |
|