Spaces:

SURESHBEEKHANI
/

Chat-with-MySQL

Sleeping

App Files Files Community

Suresh Beekhani commited on Sep 24, 2024

Commit

0dd285c

unverified ·

1 Parent(s): 394d592

Update app.py

Browse files

Files changed (1) hide show

src/app.py +97 -93

src/app.py CHANGED Viewed

@@ -1,40 +1,41 @@
-# Import necessary libraries and modules
-from dotenv import load_dotenv   # For loading environment variables from .env
-from langchain_core.messages import AIMessage, HumanMessage  # Message handling
-from langchain_core.prompts import ChatPromptTemplate  # Prompt templates for generating responses
-from langchain_core.runnables import RunnablePassthrough  # To chain operations
-from langchain_community.utilities import SQLDatabase  # SQL database utility for LangChain
-from langchain_core.output_parsers import StrOutputParser  # To parse outputs as strings
-# OpenAI model for chat (if used)
-from langchain_groq import ChatGroq  # Groq model for chat (currently used)
-import streamlit as st  # Streamlit for building the web app
-import os  # To access environment variables
-# Load environment variables from the .env file (like API keys, database credentials)
 load_dotenv()
-# Function to initialize a connection to a MySQL database
 def init_database() -> SQLDatabase:
     try:
-        # Load credentials from environment variables for better security
-        user = os.getenv("DB_USER", "root")
-        password = os.getenv("DB_PASSWORD", "admin")
         host = os.getenv("DB_HOST", "localhost")
-        port = os.getenv("DB_PORT", "3306")
-        database = os.getenv("DB_NAME", "Chinook")
-        # Construct the database URI
-        db_uri = f"mysql+mysqlconnector://{user}:{password}@{host}:{port}/{database}"
-        # Initialize and return the SQLDatabase instance
         return SQLDatabase.from_uri(db_uri)
     except Exception as e:
         st.error(f"Failed to connect to database: {e}")
         return None
-# Function to create a chain that generates SQL queries from user input and conversation history
 def get_sql_chain(db):
-    # SQL prompt template
     template = """
     You are a data analyst at a company. You are interacting with a user who is asking you questions about the company's database.
     Based on the table schema below, write a SQL query that would answer the user's question. Take the conversation history into account.
@@ -47,33 +48,32 @@ def get_sql_chain(db):
     SQL Query:
     """
-    # Create a prompt from the above template
     prompt = ChatPromptTemplate.from_template(template)
-    # Initialize Groq model for generating SQL queries (can switch to OpenAI if needed)
     llm = ChatGroq(model="mixtral-8x7b-32768", temperature=0)
-    # Helper function to get schema info from the database
     def get_schema(_):
         return db.get_table_info()
-    # Chain of operations:
-    # 1. Assign schema information from the database
-    # 2. Use the AI model to generate a SQL query
-    # 3. Parse the result into a string
     return (
-        RunnablePassthrough.assign(schema=get_schema)  # Get schema info from the database
-        | prompt  # Generate SQL query from the prompt template
-        | llm  # Use Groq model to process the prompt and return a SQL query
-        | StrOutputParser()  # Parse the result as a string
     )
-# Function to generate a response in natural language based on the SQL query result
 def get_response(user_query: str, db: SQLDatabase, chat_history: list):
-    # Generate the SQL query using the chain
     sql_chain = get_sql_chain(db)
-    # Prompt template for natural language response based on SQL query and result
     template = """
     You are a data analyst at a company. Based on the table schema, SQL query, and response, write a natural language response.
     <SCHEMA>{schema}</SCHEMA>
@@ -83,90 +83,94 @@ def get_response(user_query: str, db: SQLDatabase, chat_history: list):
     SQL Response: {response}
     """
-    # Create a natural language response prompt
     prompt = ChatPromptTemplate.from_template(template)
-    # Initialize Groq model (alternative: OpenAI)
     llm = ChatGroq(model="mixtral-8x7b-32768", temperature=0)
-    # Build a chain: generate SQL query, run it on the database, generate a natural language response
     chain = (
-        RunnablePassthrough.assign(query=sql_chain).assign(
-            schema=lambda _: db.get_table_info(),  # Get schema info
-            response=lambda vars: db.run(vars["query"]),  # Run SQL query on the database
         )
-        | prompt  # Use prompt to generate a natural language response
-        | llm  # Process prompt with Groq model
-        | StrOutputParser()  # Parse the final result as a string
     )
-    # Execute the chain and return the response
-    return chain.invoke({
         "question": user_query,
         "chat_history": chat_history,
     })
-# Initialize the Streamlit session
 if "chat_history" not in st.session_state:
-    # Initialize chat history with a welcome message from AI
     st.session_state.chat_history = [
         AIMessage(content="Hello! I'm a SQL assistant. Ask me anything about your database."),
     ]
-# Set up the Streamlit web page configuration
-st.set_page_config(page_title="Chat with MySQL", page_icon=":speech_balloon:")
-# Streamlit app title
-st.title("Chat with MySQL")
-# Sidebar for database connection settings
 with st.sidebar:
-    st.subheader("Settings")
-    st.write("Connect to your database and start chatting.")
-    # Database connection input fields
     host = st.text_input("Host", value=os.getenv("DB_HOST", "localhost"))
-    port = st.text_input("Port", value=os.getenv("DB_PORT", "3306"))
-    user = st.text_input("User", value=os.getenv("DB_USER", "root"))
-    password = st.text_input("Password", type="password", value=os.getenv("DB_PASSWORD", "admin"))
-    database = st.text_input("Database", value=os.getenv("DB_NAME", "Chinook"))
-    # Button to connect to the database
     if st.button("Connect"):
-        with st.spinner("Connecting to database..."):
-            # Initialize the database connection and store in session state
-            db = init_database()
             if db:
-                st.session_state.db = db
-                st.success("Connected to the database!")
             else:
-                st.error("Connection failed. Please check your settings.")
-# Display chat history
 for message in st.session_state.chat_history:
     if isinstance(message, AIMessage):
-        # Display AI message
-        with st.chat_message("AI"):
             st.markdown(message.content)
     elif isinstance(message, HumanMessage):
-        # Display human message
-        with st.chat_message("Human"):
             st.markdown(message.content)
-# Input field for user's message
-user_query = st.chat_input("Type a message...")
-if user_query and user_query.strip():
-    # Add user's query to the chat history
-    st.session_state.chat_history.append(HumanMessage(content=user_query))
-    # Display user's message in the chat
-    with st.chat_message("Human"):
         st.markdown(user_query)
-    # Generate and display AI's response based on the query
-    with st.chat_message("AI"):
-        response = get_response(user_query, st.session_state.db, st.session_state.chat_history)
         st.markdown(response)
-    # Add AI's response to the chat history
-    st.session_state.chat_history.append(AIMessage(content=response))

+# Import necessary libraries and modules for various tasks
+from dotenv import load_dotenv  # For loading environment variables from a .env file (such as database credentials)
+from langchain_core.messages import AIMessage, HumanMessage  # For handling messages from the AI and user
+from langchain_core.prompts import ChatPromptTemplate  # To create templates that will guide the chatbot's responses
+from langchain_core.runnables import RunnablePassthrough  # To enable chaining of different operations (like inputs/outputs)
+from langchain_community.utilities import SQLDatabase  # A tool to help connect to SQL databases using LangChain
+from langchain_core.output_parsers import StrOutputParser  # To parse outputs into plain text
+from langchain_groq import ChatGroq  # This integrates the Groq model for generating chat responses
+import streamlit as st  # Streamlit is used for building the web app (user interface)
+import os  # To access environment variables (e.g., credentials or other settings)
+import psycopg2  # A PostgreSQL database adapter to enable connections to the database
+# Load environment variables (such as DB credentials) from the .env file
 load_dotenv()
+# Function to establish a connection to the PostgreSQL database
 def init_database() -> SQLDatabase:
     try:
+        # Retrieve database connection details from environment variables, or set default values
+        user = os.getenv("DB_USER", "postgres")
+        password = os.getenv("DB_PASSWORD", "beekhani143")
         host = os.getenv("DB_HOST", "localhost")
+        port = os.getenv("DB_PORT", "5432")
+        database = os.getenv("DB_NAME", "")
+        # Construct the database URI (a URL-like string) with the necessary credentials for PostgreSQL
+        db_uri = f"postgresql+psycopg2://{user}:{password}@{host}:{port}/{database}"
+        # Connect to the database using the SQLDatabase utility and return the instance
         return SQLDatabase.from_uri(db_uri)
     except Exception as e:
+        # If connection fails, display an error message on the Streamlit UI
         st.error(f"Failed to connect to database: {e}")
         return None
+# Function to create a process (chain) that generates SQL queries based on user input and previous conversation
 def get_sql_chain(db):
+    # Template to guide how SQL queries are generated. The bot receives table schema and conversation history.
     template = """
     You are a data analyst at a company. You are interacting with a user who is asking you questions about the company's database.
     Based on the table schema below, write a SQL query that would answer the user's question. Take the conversation history into account.
     SQL Query:
     """
+    # Create a prompt template from the above instructions
     prompt = ChatPromptTemplate.from_template(template)
+    # Initialize the Groq model for generating responses with low randomness (temperature=0 for more deterministic outputs)
     llm = ChatGroq(model="mixtral-8x7b-32768", temperature=0)
+    # Function to get the schema (structure) of the tables in the database
     def get_schema(_):
         return db.get_table_info()
+    # Create a chain of operations:
+    # 1. First, get the database schema.
+    # 2. Then, use the prompt template to guide query creation.
+    # 3. Finally, parse the output as a plain text SQL query.
     return (
+        RunnablePassthrough.assign(schema=get_schema)  # Pass the schema into the chain
+        | prompt  # Use the prompt template
+        | llm  # Generate a response using the Groq model
+        | StrOutputParser()  # Parse the response as a string (SQL query)
     )
+# Function to generate a natural language response based on SQL query and database result
 def get_response(user_query: str, db: SQLDatabase, chat_history: list):
+    # First, get the SQL chain (responsible for generating SQL queries)
     sql_chain = get_sql_chain(db)
+    # Template to guide how the AI responds to the user's query based on the SQL results
     template = """
     You are a data analyst at a company. Based on the table schema, SQL query, and response, write a natural language response.
     <SCHEMA>{schema}</SCHEMA>
     SQL Response: {response}
     """
+    # Create a new prompt template for generating a response
     prompt = ChatPromptTemplate.from_template(template)
+    # Initialize the Groq model for response generation
     llm = ChatGroq(model="mixtral-8x7b-32768", temperature=0)
+    # Chain the following tasks:
+    # 1. Generate the SQL query using the earlier chain.
+    # 2. Get the schema and execute the query on the database.
+    # 3. Return the natural language response based on the query and its results.
     chain = (
+        RunnablePassthrough.assign(query=sql_chain)  # Generate SQL query
+        .assign(
+            schema=lambda _: db.get_table_info(),  # Pass the schema to the next step
+            response=lambda vars: db.run(vars["query"].replace("\\", "")),  # Execute the SQL query and clean up backslashes
         )
+        | prompt  # Use the prompt template for generating natural language response
+        | llm  # Generate the final response using the model
+        | StrOutputParser()  # Parse the output into plain text
     )
+    # Invoke the chain to generate the final response based on the user query and history
+    result = chain.invoke({
         "question": user_query,
         "chat_history": chat_history,
     })
+    # Debugging: Print the SQL query being executed
+    if isinstance(result, str):
+        print(f"SQL Query: {result}")
+    else:
+        sql_query = result.get('query', 'No query generated')
+        print(f"SQL Query: {sql_query}")
+    # Return the result (natural language response)
+    return result
+# Initialize the chat session when Streamlit app starts
 if "chat_history" not in st.session_state:
     st.session_state.chat_history = [
+        # First message from AI assistant
         AIMessage(content="Hello! I'm a SQL assistant. Ask me anything about your database."),
     ]
+# Streamlit page configuration: Set the page title and icon
+st.set_page_config(page_title="Chat with PostgreSQL", page_icon=":speech_balloon:")
+st.title("Chat with PostgreSQL")  # Display title on the webpage
+# Sidebar configuration for database connection settings
 with st.sidebar:
+    st.subheader("Settings")  # Display a heading for the settings section
+    st.write("Connect to your database and start chatting.")  # Instruction text for users
+    # Input fields for database connection details (host, port, user, password, and database name)
     host = st.text_input("Host", value=os.getenv("DB_HOST", "localhost"))
+    port = st.text_input("Port", value=os.getenv("DB_PORT", "5432"))
+    user = st.text_input("User", value=os.getenv("DB_USER", "postgres"))
+    password = st.text_input("Password", type="password", value=os.getenv("DB_PASSWORD", "beekhani143"))
+    database = st.text_input("Database", value=os.getenv("DB_NAME", "db"))
+    # Button to attempt database connection
     if st.button("Connect"):
+        with st.spinner("Connecting to database..."):  # Show a spinner while connecting
+            db = init_database()  # Call the function to connect to the database
             if db:
+                st.session_state.db = db  # Save the connection in session state
+                st.success("Connected to the database!")  # Display success message
             else:
+                st.error("Connection failed. Please check your settings.")  # Display error message if connection fails
+# Display the chat history (both AI and user messages)
 for message in st.session_state.chat_history:
     if isinstance(message, AIMessage):
+        with st.chat_message("AI"):  # Display AI messages in the chat
             st.markdown(message.content)
     elif isinstance(message, HumanMessage):
+        with st.chat_message("Human"):  # Display human messages in the chat
             st.markdown(message.content)
+# Input field for the user to type their message
+user_query = st.chat_input("Type a message...")  # Field to capture user query
+if user_query and user_query.strip():  # If the user entered a valid query
+    st.session_state.chat_history.append(HumanMessage(content=user_query))  # Save the user query in chat history
+    with st.chat_message("Human"):  # Display the user's message in the chat
         st.markdown(user_query)
+    with st.chat_message("AI"):  # Generate and display the AI response
+        response = get_response(user_query, st.session_state.db, st.session_state.chat_history)  # Get the AI's response
         st.markdown(response)
+    st.session_state.chat_history.append(AIMessage(content=response))  # Add the AI's response to the chat history