md-vasim committed
Commit a5c729e
1 Parent(s): d1caba8

model changed to gguf

app/__pycache__/__init__.cpython-310.pyc ADDED
Binary file (159 Bytes).
 
app/__pycache__/views.cpython-310.pyc ADDED
Binary file (1.36 kB).
 
app/views.py CHANGED
@@ -39,4 +39,4 @@ with gr.Blocks(
 
 
 # mounting at the path
-app = gr.mount_gradio_app(app, llama2bot.queue(concurrency_count=20), path="/llama2")
+app = gr.mount_gradio_app(app, llama2bot, path="/llama2")
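A note on the views.py change above: Gradio 4.x removed the concurrency_count argument from queue(), which is presumably why the Blocks object is now mounted directly. A minimal sketch of how the mount plausibly fits together, assuming the FastAPI app and the llama2bot Blocks are defined earlier in app/views.py (the UI layout below is a hypothetical stand-in, not from this diff):

import gradio as gr
from fastapi import FastAPI

app = FastAPI()

# hypothetical stand-in for the real llama2bot interface,
# whose actual layout is not shown in this diff
with gr.Blocks() as llama2bot:
    chatbot = gr.Chatbot()
    msg = gr.Textbox()

# mounting at the path, as in the new line of the diff;
# the Gradio UI is then served under /llama2 by the FastAPI app
app = gr.mount_gradio_app(app, llama2bot, path="/llama2")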
src/__pycache__/__init__.cpython-310.pyc ADDED
Binary file (159 Bytes).
 
src/__pycache__/chains.cpython-310.pyc ADDED
Binary file (978 Bytes).
 
src/__pycache__/grutils.cpython-310.pyc ADDED
Binary file (790 Bytes).
 
src/chains.py CHANGED
@@ -1,9 +1,14 @@
 from langchain.llms import CTransformers
-from langchain import PromptTemplate, LLMChain
+# from langchain import PromptTemplate, LLMChain
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
 from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
 
+ggufmodel = f"TheBloke/Llama-2-7B-Chat-GGUF"
+ggufmodelfile = f"llama-2-7b-chat.Q5_K_M.gguf"
 
-llm = CTransformers(model="TheBloke/Llama-2-7B-Chat-GGML", model_file = 'llama-2-7b-chat.ggmlv3.q2_K.bin', callbacks=[StreamingStdOutCallbackHandler()])
+# llm = CTransformers(model="TheBloke/Llama-2-7B-Chat-GGML", model_file = 'llama-2-7b-chat.ggmlv3.q2_K.bin', callbacks=[StreamingStdOutCallbackHandler()])
+llm = CTransformers(model=ggufmodel, model_file = ggufmodelfile, callbacks=[StreamingStdOutCallbackHandler()])
 
 
 template = """
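For context on the chains.py change above: the commit swaps the quantized GGML weights for GGUF ones (ctransformers can load either format) and moves PromptTemplate and LLMChain to their newer langchain import paths. A sketch of how the updated imports plausibly come together further down the file, using the names from the diff; the template body is truncated at the end of the hunk, so the prompt text below is hypothetical:

from langchain.llms import CTransformers
from langchain.chains import LLMChain
from langchain.prompts import PromptTemplate
from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler

# GGUF model and file names taken from the new lines of the diff
llm = CTransformers(
    model="TheBloke/Llama-2-7B-Chat-GGUF",
    model_file="llama-2-7b-chat.Q5_K_M.gguf",
    callbacks=[StreamingStdOutCallbackHandler()],
)

# hypothetical prompt; the real template is cut off in the diff
template = """[INST] {question} [/INST]"""
prompt = PromptTemplate(template=template, input_variables=["question"])
chain = LLMChain(prompt=prompt, llm=llm)

# streams tokens to stdout via the callback handler above
print(chain.run(question="What changed between GGML and GGUF?"))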