Update app.py
app.py CHANGED
@@ -1,3 +1,5 @@
+!CMAKE_ARGS="-DLLAMA_CUBLAS=on" FORCE_CMAKE=1 pip install --upgrade --force-reinstall llama-cpp-python --no-cache-dir
+
 from threading import Thread
 from llama_cpp import Llama
 import torch
@@ -9,13 +11,13 @@ print("Running on device:", torch_device)
 print("CPU threads:", torch.get_num_threads())
 
 llm = Llama(model_path = 'Llama-2-ko-7B-chat-gguf-q4_0.bin',
-            n_ctx=
+            n_ctx=50,
             n_threads = 8,
-            n_batch =
+            n_batch = 5
             )
 
 def gen(x, max_new_tokens):
-    output = llm(f"
+    output = llm(f"### 명령어:\n{x}\n\n### 응답:", max_tokens=max_new_tokens, stop=["###", "\n", ":"], echo=True)
 
     return output['choices'][0]['text'].replace('▁',' ')
 
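For reference, a minimal usage sketch of the updated gen() helper, assuming llama-cpp-python is installed and Llama-2-ko-7B-chat-gguf-q4_0.bin sits in the working directory; the example question and the 32-token budget are illustrative assumptions, not part of the commit.

from llama_cpp import Llama

# Same constructor arguments as in the diff; n_ctx=50 is a very small context
# window, so the prompt plus the completion must fit within 50 tokens.
llm = Llama(model_path='Llama-2-ko-7B-chat-gguf-q4_0.bin',
            n_ctx=50,
            n_threads=8,
            n_batch=5)

def gen(x, max_new_tokens):
    # Korean Alpaca-style template: "### 명령어:" = "### Instruction:",
    # "### 응답:" = "### Response:". Generation stops at "###", a newline, or ":".
    output = llm(f"### 명령어:\n{x}\n\n### 응답:",
                 max_tokens=max_new_tokens,
                 stop=["###", "\n", ":"],
                 echo=True)
    # '▁' is the SentencePiece word-boundary marker; swap it for a plain space.
    return output['choices'][0]['text'].replace('▁', ' ')

# Illustrative question ("What is the capital of Korea?").
print(gen("한국의 수도는 어디인가요?", max_new_tokens=32))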