wise-labs-new / app.py
parvezalmuqtadir's picture
Update app.py
e5e4cf0 verified
import os
import io
import streamlit as st
from streamlit_chat import message
from dotenv import load_dotenv
from gtts import gTTS
from audiorecorder import audiorecorder
from pdfquery import PDFQuery
import whisper
import urllib.request
from urllib.request import urlopen
import ssl
import json
ssl._create_default_https_context = ssl._create_unverified_context
# Load environment variables from .env file
load_dotenv()
st.set_page_config(page_title="Wise Chat Labs - Advanced")
def display_messages():
st.subheader("Chat with your PDF")
for i, (msg, is_user) in enumerate(st.session_state["messages"]):
message(msg, is_user=is_user, key=str(i))
st.session_state["thinking_spinner"] = st.empty()
def generate_tts_audio(text):
tts = gTTS(text=text, lang='en')
audio_bytes = io.BytesIO()
tts.write_to_fp(audio_bytes)
audio_bytes.seek(0)
return audio_bytes
def play_audio(audio_bytes):
audio_bytes.seek(0)
st.audio(audio_bytes, format='audio/mp3', start_time=0)
def process_input(user_text):
with st.session_state["thinking_spinner"], st.spinner("Thinking..."):
query_text = st.session_state["pdfquery"].ask(user_text)
audio_response = generate_tts_audio(query_text)
play_audio(audio_response)
st.session_state["messages"].append((user_text, True))
st.session_state["messages"].append((query_text, False))
def load_and_ingest_document():
file_path = 'osha.pdf'
if os.path.exists(file_path):
st.session_state["pdfquery"].ingest(file_path)
else:
st.error("PDF file not found. Please ensure 'osha.pdf' is in the root directory.")
def is_openai_api_key_set() -> bool:
return len(st.session_state.get("OPENAI_API_KEY", "")) > 0
def transcribe_audio_to_text(audio_file_path):
model = whisper.load_model("base")
result = model.transcribe(audio_file_path)
return result["text"]
def main():
if 'messages' not in st.session_state:
st.session_state['messages'] = []
st.header("Wise Chat Labs - Your Ultimate Chatbot")
display_messages()
if 'OPENAI_API_KEY' not in st.session_state:
st.session_state['OPENAI_API_KEY'] = os.getenv("OPENAI_API_KEY", "")
if is_openai_api_key_set():
st.session_state['pdfquery'] = PDFQuery(st.session_state["OPENAI_API_KEY"])
load_and_ingest_document()
else:
st.session_state['pdfquery'] = None
st.error("OpenAI API key is not set. Please check your .env file.")
user_input = st.text_input("Type your message here...", key="user_input")
if user_input:
process_input(user_input)
st.title("Or speak your message...")
audio = audiorecorder("Start Talking", "Click to stop", key="audio_recorder")
if audio is not None and hasattr(audio, 'export'):
audio_file_path = "user_audio_input.wav"
audio.export(audio_file_path, format="wav")
user_text = transcribe_audio_to_text(audio_file_path)
process_input(user_text)
if __name__ == "__main__":
main()