andreped committed on
Commit
60a59c6
1 Parent(s): 183d24b

Use gdown python API to automatically download test data during launch

Browse files
Files changed (3) hide show
  1. .gitignore +1 -2
  2. README.md +10 -4
  3. app.py +9 -0
.gitignore CHANGED
@@ -1,5 +1,4 @@
1
- secrets.toml
2
  venv/
3
  data/
4
  .DS_Store
5
- config.json
 
 
1
  venv/
2
  data/
3
  .DS_Store
4
+ config.json
README.md CHANGED
@@ -20,14 +20,20 @@ pip install -r requirements.txt
20
  export OPENAI_API_KEY=<insert key here>
21
  ```
22
 
23
- 3. Download test data:
24
  ```
25
- gdown https://drive.google.com/drive/folders/1uDSAWtLvp1YPzfXUsK_v6DeWta16pq6y -O ./data/ --folder
 
 
 
 
 
 
26
  ```
27
 
28
- 3. Launch the app:
29
  ```
30
  streamlit run app.py
31
  ```
32
 
33
- You can then access the app in your browser at `http://localhost:8501`
 
20
  export OPENAI_API_KEY=<insert key here>
21
  ```
22
 
23
+ 3. Create the `config.json` file and fill in the relevant info:
24
  ```
25
+ {
26
+ "CHATGPT_MODEL":"<insert model name>",
27
+ "OPENAI_API_BASE":"https://<insert-openai-service-name>.openai.azure.com",
28
+ "OPENAI_API_VERSION":"<insert version>",
29
+ "ENGINE": "<insert deployment model name>",
30
+ "ENGINE_EMBEDDING": "<insert deployment embedding name>"
31
+ }
32
  ```
33
 
34
+ 4. Launch the app:
35
  ```
36
  streamlit run app.py
37
  ```
38
 
39
+ A Streamlit browser window should automatically open. If not, the app can be accessed at `http://localhost:8501`
app.py CHANGED
@@ -2,6 +2,7 @@ import json
2
  import os
3
 
4
  import streamlit as st
 
5
  from llama_index import ServiceContext
6
  from llama_index import SimpleDirectoryReader
7
  from llama_index import VectorStoreIndex
@@ -9,6 +10,7 @@ from llama_index import set_global_service_context
9
  from llama_index.embeddings import OpenAIEmbedding
10
  from llama_index.llms import AzureOpenAI
11
 
 
12
  # Initialize message history
13
  st.header("Chat with André's research 💬 📚")
14
 
@@ -20,6 +22,12 @@ with open(r"config.json") as config_file:
20
  config_details = json.load(config_file)
21
 
22
 
 
 
 
 
 
 
23
  @st.cache_resource(show_spinner=False)
24
  def load_data():
25
  with st.spinner(text="Loading and indexing the provided dataset – hang tight! This may take a few seconds."):
@@ -53,6 +61,7 @@ def load_data():
53
 
54
 
55
  def main():
 
56
  index = load_data()
57
  chat_engine = index.as_chat_engine(chat_mode="condense_question", verbose=True)
58
 
 
2
  import os
3
 
4
  import streamlit as st
5
+ from gdown import download_folder
6
  from llama_index import ServiceContext
7
  from llama_index import SimpleDirectoryReader
8
  from llama_index import VectorStoreIndex
 
10
  from llama_index.embeddings import OpenAIEmbedding
11
  from llama_index.llms import AzureOpenAI
12
 
13
+
14
  # Initialize message history
15
  st.header("Chat with André's research 💬 📚")
16
 
 
22
  config_details = json.load(config_file)
23
 
24
 
25
+ def download_test_data():
26
+ url = "https://drive.google.com/drive/folders/1uDSAWtLvp1YPzfXUsK_v6DeWta16pq6y"
27
+ with st.spinner(text="Downloading test data. Might take a few seconds."):
28
+ download_folder(url, quiet=True, use_cookies=False, output="./data/")
29
+
30
+
31
  @st.cache_resource(show_spinner=False)
32
  def load_data():
33
  with st.spinner(text="Loading and indexing the provided dataset – hang tight! This may take a few seconds."):
 
61
 
62
 
63
  def main():
64
+ download_test_data()
65
  index = load_data()
66
  chat_engine = index.as_chat_engine(chat_mode="condense_question", verbose=True)
67