Spaces:
Runtime error
Runtime error
Commit
•
22472c0
1
Parent(s):
024704e
Create app.py
Browse files
app.py
ADDED
@@ -0,0 +1,93 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import os
|
2 |
+
import tempfile
|
3 |
+
import streamlit as st
|
4 |
+
from streamlit_chat import message
|
5 |
+
from pdfquery import PDFQuery
|
6 |
+
from dotenv import load_dotenv
|
7 |
+
from gtts import gTTS
|
8 |
+
import io
|
9 |
+
import base64
|
10 |
+
|
11 |
+
# Load environment variables from .env file
|
12 |
+
load_dotenv()
|
13 |
+
|
14 |
+
st.set_page_config(page_title="Wise Chat Labs")
|
15 |
+
|
16 |
+
def display_messages():
|
17 |
+
st.subheader("Chat")
|
18 |
+
for i, (msg, is_user) in enumerate(st.session_state["messages"]):
|
19 |
+
message(msg, is_user=is_user, key=str(i))
|
20 |
+
st.session_state["thinking_spinner"] = st.empty()
|
21 |
+
|
22 |
+
def generate_tts_audio(text):
|
23 |
+
tts = gTTS(text=text, lang='en')
|
24 |
+
audio_bytes = io.BytesIO()
|
25 |
+
tts.write_to_fp(audio_bytes)
|
26 |
+
audio_bytes.seek(0)
|
27 |
+
return audio_bytes
|
28 |
+
|
29 |
+
def play_audio(audio_bytes):
|
30 |
+
base64_audio = base64.b64encode(audio_bytes.read()).decode('utf-8')
|
31 |
+
audio_html = f'<audio autoplay><source src="data:audio/mp3;base64,{base64_audio}" type="audio/mp3"></audio>'
|
32 |
+
st.markdown(audio_html, unsafe_allow_html=True)
|
33 |
+
|
34 |
+
def process_input():
|
35 |
+
if st.session_state["user_input"] and len(st.session_state["user_input"].strip()) > 0:
|
36 |
+
user_text = st.session_state["user_input"].strip()
|
37 |
+
with st.session_state["thinking_spinner"], st.spinner("Thinking..."):
|
38 |
+
query_text = st.session_state["pdfquery"].ask(user_text)
|
39 |
+
|
40 |
+
# Generate and play audio for the response with autoplay
|
41 |
+
audio_response = generate_tts_audio(query_text)
|
42 |
+
play_audio(audio_response)
|
43 |
+
|
44 |
+
st.session_state["messages"].append((user_text, True))
|
45 |
+
st.session_state["messages"].append((query_text, False))
|
46 |
+
|
47 |
+
def read_and_save_file():
|
48 |
+
st.session_state["pdfquery"].forget() # to reset the knowledge base
|
49 |
+
st.session_state["messages"] = []
|
50 |
+
st.session_state["user_input"] = ""
|
51 |
+
|
52 |
+
for file in st.session_state["file_uploader"]:
|
53 |
+
with tempfile.NamedTemporaryFile(delete=False) as tf:
|
54 |
+
tf.write(file.getbuffer())
|
55 |
+
file_path = tf.name
|
56 |
+
|
57 |
+
with st.session_state["ingestion_spinner"], st.spinner(f"Ingesting {file.name}"):
|
58 |
+
st.session_state["pdfquery"].ingest(file_path)
|
59 |
+
os.remove(file_path)
|
60 |
+
|
61 |
+
def is_openai_api_key_set() -> bool:
|
62 |
+
return len(st.session_state["OPENAI_API_KEY"]) > 0
|
63 |
+
|
64 |
+
def main():
|
65 |
+
if len(st.session_state) == 0:
|
66 |
+
st.session_state["messages"] = []
|
67 |
+
st.session_state["OPENAI_API_KEY"] = os.getenv("OPENAI_API_KEY", "")
|
68 |
+
if is_openai_api_key_set():
|
69 |
+
st.session_state["pdfquery"] = PDFQuery(st.session_state["OPENAI_API_KEY"])
|
70 |
+
else:
|
71 |
+
st.session_state["pdfquery"] = None
|
72 |
+
|
73 |
+
st.header("ChatPDF")
|
74 |
+
|
75 |
+
st.subheader("Upload a document")
|
76 |
+
st.file_uploader(
|
77 |
+
"Upload document",
|
78 |
+
type=["pdf"],
|
79 |
+
key="file_uploader",
|
80 |
+
on_change=read_and_save_file,
|
81 |
+
label_visibility="collapsed",
|
82 |
+
accept_multiple_files=True,
|
83 |
+
disabled=not is_openai_api_key_set(),
|
84 |
+
)
|
85 |
+
|
86 |
+
st.session_state["ingestion_spinner"] = st.empty()
|
87 |
+
|
88 |
+
display_messages()
|
89 |
+
st.text_input("Message", key="user_input", disabled=not is_openai_api_key_set(), on_change=process_input)
|
90 |
+
|
91 |
+
|
92 |
+
if __name__ == "__main__":
|
93 |
+
main()
|