transferring initializations to st.session_state
- RAG.py +1 -2
- streamlit_app.py +29 -31
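Streamlit re-executes the entire script on every user interaction, so any model or client constructed without a guard is rebuilt on each rerun. This commit moves those constructions behind st.session_state key checks, so each object is created once per session and reused afterwards. A minimal sketch of the pattern, assuming ChatOpenAI comes from langchain_openai as in typical LangChain apps:

import streamlit as st
from langchain_openai import ChatOpenAI

# Construct the model once per session; later reruns reuse the cached object.
if "llm" not in st.session_state:
    st.session_state.llm = ChatOpenAI(
        model="gpt-4",
        temperature=0,
        timeout=60,
        max_retries=2,
    )

llm = st.session_state.llm  # safe to read on every rerun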
RAG.py
CHANGED

@@ -118,7 +118,7 @@ def parse_xml_and_check(xml_string: str) -> str:
 
     return parsed_response.get('RESPONSE', "No response found in the output")
 
-def RAG(llm: Any, query: str, index_name: str, embeddings: Any,vectorstore:PineconeVectorStore, top: int = 10, k: int = 100) -> Tuple[str, List[Document]]:
+def RAG(llm: Any, query: str,vectorstore:PineconeVectorStore, top: int = 10, k: int = 100) -> Tuple[str, List[Document]]:
     """Main RAG function with improved error handling and validation."""
     start = time.time()
     try:
@@ -147,7 +147,6 @@ def RAG(llm: Any, query: str, index_name: str, embeddings: Any,vectorstore:Pinec
 
         <QUERY>{query}</QUERY>
         """
-
        )
        query_prompt = query_template.invoke({"query":query})
        query_response = llm.invoke(query_prompt)
streamlit_app.py
CHANGED

@@ -26,20 +26,29 @@ def initialize_models() -> Tuple[Optional[ChatOpenAI], HuggingFaceEmbeddings]:
     try:
         load_dotenv()
 
-
-
-
-
-
-
-
-
-        # Initialize embeddings
-        embeddings = HuggingFaceEmbeddings(
-            model_name="sentence-transformers/all-MiniLM-L6-v2"
-        )
+        if "llm" not in st.session_state:
+            # Initialize OpenAI model
+            st.session_state.llm = ChatOpenAI(
+                model="gpt-4", # Changed from gpt-4o-mini which appears to be a typo
+                temperature=0,
+                timeout=60, # Added reasonable timeout
+                max_retries=2
+            )
 
-
+        if "embeddings" not in st.session_state:
+            # Initialize embeddings
+            st.session_state.embeddings = HuggingFaceEmbeddings(
+                model_name="sentence-transformers/all-MiniLM-L6-v2"
+            )
+
+        if "pinecone" not in st.session_state:
+            pinecone_api_key = os.getenv("PINECONE_API_KEY")
+            INDEX_NAME = 'bpl-rag'
+            #initialize vectorstore
+            pc = Pinecone(api_key=pinecone_api_key)
+
+            index = pc.Index(INDEX_NAME)
+            st.session_state.pinecone = PineconeVectorStore(index=index, embedding=st.session_state.embeddings)
 
     except Exception as e:
         logger.error(f"Error initializing models: {str(e)}")
@@ -90,35 +99,24 @@ def display_sources(sources: List) -> None:
             st.error(f"Error displaying source {i}")
 
 def main():
-    st.title("RAG
+    st.title("Digital Commonwealth RAG")
 
     INDEX_NAME = 'bpl-rag'
 
-    pinecone_api_key = os.getenv("PINECONE_API_KEY")
-
     # Initialize session state
     if "messages" not in st.session_state:
         st.session_state.messages = []
 
     # Initialize models
-
-
-        st.error("Failed to initialize the application. Please check the logs.")
-        return
-
-    #initialize vectorstore
-    pc = Pinecone(api_key=pinecone_api_key)
-
-    index = pc.Index(INDEX_NAME)
-    vector_store = PineconeVectorStore(index=index, embedding=embeddings)
-
+    initialize_models()
+
     # Display chat history
     for message in st.session_state.messages:
         with st.chat_message(message["role"]):
             st.markdown(message["content"])
 
     # Chat input
-    user_input = st.chat_input("Type your
+    user_input = st.chat_input("Type your query here...")
     if user_input:
         # Display user message
         with st.chat_message("user"):
@@ -130,10 +128,10 @@ def main():
            with st.spinner("Let Me Think..."):
                response, sources = process_message(
                    query=user_input,
-                    llm=llm,
                    index_name=INDEX_NAME,
-                    embeddings=embeddings,
-                    vectorstore=vector_store
+                    llm=st.session_state.llm,
+                    embeddings=st.session_state.embeddings,
+                    vectorstore=st.session_state.pinecone
                )
 
                if isinstance(response, str):
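After this change main() calls initialize_models() without unpacking a return value; the models are read back from st.session_state.llm, st.session_state.embeddings, and st.session_state.pinecone at the call site. The chat loop itself follows the standard Streamlit pattern; a self-contained sketch, with an echo reply standing in for the real process_message call:

import streamlit as st

if "messages" not in st.session_state:
    st.session_state.messages = []

# Each rerun redraws the page from scratch, so stored history
# must be re-rendered on every pass.
for message in st.session_state.messages:
    with st.chat_message(message["role"]):
        st.markdown(message["content"])

user_input = st.chat_input("Type your query here...")
if user_input:
    st.session_state.messages.append({"role": "user", "content": user_input})
    with st.chat_message("user"):
        st.markdown(user_input)

    reply = f"Echo: {user_input}"  # stand-in for process_message(...)
    st.session_state.messages.append({"role": "assistant", "content": reply})
    with st.chat_message("assistant"):
        st.markdown(reply)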