Spaces: hf llm
- backend.py +2 -2
- requirements.txt +1 -1
backend.py
CHANGED
@@ -63,7 +63,7 @@ os.environ['TOKENIZERS_PARALLELISM'] = 'false'
 llm = HuggingFaceLLM(
     context_window=4096,
     max_new_tokens=256,
-    generate_kwargs={"temperature": 0.
+    generate_kwargs={"temperature": 0.0, "do_sample": False},
     system_prompt=system_prompt,
     tokenizer_name="meta-llama/Llama-2-7b-chat-hf",
     model_name="meta-llama/Llama-2-7b-chat-hf",
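The edited line replaces a truncated sampling setup with greedy decoding. As a standalone sketch (not the Space's code) of what do_sample=False means at the transformers level, using the tiny sshleifer/tiny-gpt2 checkpoint as a stand-in for the gated Llama-2 model:

from transformers import AutoModelForCausalLM, AutoTokenizer

tok = AutoTokenizer.from_pretrained("sshleifer/tiny-gpt2")    # tiny stand-in model
model = AutoModelForCausalLM.from_pretrained("sshleifer/tiny-gpt2")

ids = tok("Hello", return_tensors="pt").input_ids
# do_sample=False selects greedy decoding, so generation is deterministic.
out1 = model.generate(ids, max_new_tokens=8, do_sample=False)
out2 = model.generate(ids, max_new_tokens=8, do_sample=False)
assert (out1 == out2).all()  # same prompt, same output, every run

With do_sample=False, generate() ignores the temperature value, so the 0.0 in the diff documents intent rather than changing behavior.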
@@ -199,7 +199,7 @@ def handle_query(query_str: str,
         verbose=False,
     )"""
 
-
+    gr.Info("chat engine..")
     chat_engine = index.as_chat_engine(
         chat_mode="context",
         similarity_top_k=3,
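gr.Info is Gradio's toast helper: called inside an event handler, it flashes a transient message in the browser without blocking the handler, which makes it a cheap progress signal before the comparatively slow chat-engine call. A minimal sketch, assuming gr.ChatInterface as the front end (an assumption; only the gr.Info call appears in the diff):

import gradio as gr

def handle_query(query_str, history):
    # Pops a transient toast in the UI while the handler keeps running.
    gr.Info("chat engine..")
    return "stub answer"  # stand-in for the real chat-engine response

demo = gr.ChatInterface(fn=handle_query)
demo.launch()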
requirements.txt
CHANGED
@@ -14,7 +14,7 @@ pypdf
 langchain>=0.2.3
 langchain-community
 langchain-huggingface
-bitsandbytes
+bitsandbytes
 accelerate
 gradio
 spaces
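The requirements diff touches the bitsandbytes line (the rendered old and new text are identical, so the underlying edit is not recoverable here). bitsandbytes and accelerate are the pair that lets transformers load a 7B checkpoint quantized on modest Space hardware; a hedged sketch of that usual pattern, assuming 8-bit loading (the diff does not show how backend.py actually loads the model):

from transformers import AutoModelForCausalLM, BitsAndBytesConfig

model = AutoModelForCausalLM.from_pretrained(
    "meta-llama/Llama-2-7b-chat-hf",  # gated repo; requires accepted access
    quantization_config=BitsAndBytesConfig(load_in_8bit=True),  # uses bitsandbytes
    device_map="auto",  # accelerate places weights across GPU/CPU
)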