Spaces:

mobinln
/

chatbot

Running

mobinln committed on Jun 17

Commit

c2aa89c

•

1 Parent(s): 6da1c26

fix: change to qwen2

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,8 +1,17 @@
 import gradio as gr
 from llama_cpp import Llama
-model = "Qwen/Qwen1.5-0.5B-Chat-GGUF"
-llm = Llama.from_pretrained(repo_id=model, filename="*q8_0.gguf", verbose=True)
 def respond(

 import gradio as gr
 from llama_cpp import Llama
+model = "Qwen/Qwen2-0.5B-Instruct-GGUF"
+llm = Llama.from_pretrained(
+    repo_id=model,
+    filename="*q8_0.gguf",
+    verbose=True,
+    use_mmap=False,
+    use_mlock=True,
+    n_threads=2,
+    n_threads_batch=2,
+    n_ctx=32000,
+)
 def respond(