Spaces:

vishwask
/

witp_poc

Paused

App Files Community

vishwask committed on Oct 13, 2023

Commit

75ded75

•

1 Parent(s): 6d9ed4f

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -10

app.py CHANGED Viewed

@@ -48,8 +48,8 @@ def load_model(_docs):
     text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024, chunk_overlap=256)
     texts = text_splitter.split_documents(docs)
     db = FAISS.from_documents(texts, embeddings)
-    model_name_or_path = "/home/user/app/Llama-2-13B-chat-GPTQ/"
-    #model_name_or_path = "/home/user/app/codeLlama"
     model_basename = "model"
@@ -57,8 +57,8 @@ def load_model(_docs):
     model = AutoGPTQForCausalLM.from_quantized(
         model_name_or_path,
-        revision="gptq-8bit-128g-actorder_False",
-        #revision="gptq-8bit-128g-actorder_True",
         model_basename=model_basename,
         use_safetensors=True,
         trust_remote_code=True,
@@ -105,12 +105,12 @@ def load_model(_docs):
                              streamer=streamer,)
     llm = HuggingFacePipeline(pipeline=text_pipeline, model_kwargs={"temperature": 0.1})
-    SYSTEM_PROMPT = ("Use the following pieces of context to answer the question at the end. "
-                     "If you don't know the answer, just say that you don't know, "
-                     "don't try to make up an answer.")
-    # SYSTEM_PROMPT = ("Use the following pieces of context along with general information you possess to answer the question at the end."
-    #              "If you don't know the answer, just say that you don't know, "
-    #              "don't try to make up an answer. Answer what is asked strictly and do not provide further questions at all.")
     template = generate_prompt("""{context}  Question: {question} """,system_prompt=SYSTEM_PROMPT,) #Enter memory here!
     prompt = PromptTemplate(template=template, input_variables=["context",  "question"]) #Add history here

     text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024, chunk_overlap=256)
     texts = text_splitter.split_documents(docs)
     db = FAISS.from_documents(texts, embeddings)
+    #model_name_or_path = "/home/user/app/Llama-2-13B-chat-GPTQ/"
+    #model_name_or_path = "/home/user/app/codeLlama/"
     model_basename = "model"
     model = AutoGPTQForCausalLM.from_quantized(
         model_name_or_path,
+        #revision="gptq-8bit-128g-actorder_False",
+        revision="gptq-8bit-128g-actorder_True",
         model_basename=model_basename,
         use_safetensors=True,
         trust_remote_code=True,
                              streamer=streamer,)
     llm = HuggingFacePipeline(pipeline=text_pipeline, model_kwargs={"temperature": 0.1})
+    # SYSTEM_PROMPT = ("Use the following pieces of context to answer the question at the end. "
+    #                  "If you don't know the answer, just say that you don't know, "
+    #                  "don't try to make up an answer.")
+    SYSTEM_PROMPT = ("Use the following pieces of context along with general information you possess to answer the question at the end."
+                 "If you don't know the answer, just say that you don't know, "
+                 "don't try to make up an answer.")
     template = generate_prompt("""{context}  Question: {question} """,system_prompt=SYSTEM_PROMPT,) #Enter memory here!
     prompt = PromptTemplate(template=template, input_variables=["context",  "question"]) #Add history here