Spaces:

isayahc
/

sample_name

Runtime error

isayahc committed on Nov 15, 2023

Commit

91bdf3d

•

1 Parent(s): a3a6d28

Update app.py

attempting to get model to work

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,13 +6,22 @@ from langchain.embeddings import HuggingFaceBgeEmbeddings
 from langchain.chains import RetrievalQA
 import gradio as gr
-local_llm = "https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q5_K_S.gguf"
 # Load model directly
 # from transformers import AutoModel
 # local_llm = AutoModel.from_pretrained("TheBloke/zephyr-7B-beta-GGUF")
 config = {
     "max_new_token": 1024,
     "repetition_penalty": 1.1,

 from langchain.chains import RetrievalQA
 import gradio as gr
+# local_llm = "https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/blob/main/zephyr-7b-beta.Q5_K_S.gguf"
 # Load model directly
 # from transformers import AutoModel
 # local_llm = AutoModel.from_pretrained("TheBloke/zephyr-7B-beta-GGUF")
+local_llm = CTransformers(
+    model = "TheBloke/zephyr-7B-beta-GGUF",
+    model_file = "zephyr-7b-beta.Q4_0.gguf",
+    model_type="mistral",
+    lib="avx2", #for CPU use
+    **config
+)
 config = {
     "max_new_token": 1024,
     "repetition_penalty": 1.1,