Spaces:

AI-ANK
/

AInimal_Go

Running

App Files Community

AI-ANK committed on Nov 26, 2023

Commit

ffa0700

1 Parent(s): 9a275cd

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -25

app.py CHANGED Viewed

@@ -8,6 +8,8 @@ from llama_index import ServiceContext, VectorStoreIndex, Document, StorageConte
 from llama_index.memory import ChatMemoryBuffer
 import os
 import datetime
 #imports for resnet
 from transformers import AutoFeatureExtractor, ResNetForImageClassification
@@ -45,8 +47,7 @@ This application, titled 'AInimal Go!', is a conceptual prototype designed to de
 cookie_manager = stx.CookieManager()
 #Function to init resnet
-@st.cache_resource()
 def load_model_and_labels():
     # Load animal labels as a dictionary
     animal_labels_dict = {}
@@ -81,9 +82,11 @@ def get_image_caption(image_data):
     return predicted_label_name, predicted_label_id
-@st.cache_resource
 def init_llm(api_key):
-    llm = PaLM(api_key=api_key)
     service_context = ServiceContext.from_defaults(llm=llm, embed_model="local")
     storage_context = StorageContext.from_defaults(persist_dir="storage")
@@ -92,27 +95,34 @@ def init_llm(api_key):
     return llm, service_context, storage_context, index, chatmemory
-llm, service_context, storage_context, index, chatmemory = init_llm(st.secrets['GOOGLE_API_KEY'])
 def is_animal(predicted_label_id):
     """Return True if the predicted class ID falls in the animal range.

     Assumes the classifier emits standard ImageNet-1k class indices, in
     which the animal classes occupy 0-397 and index 398 is "abacus".
     NOTE(review): confirm against the label file used by the classifier.

     Args:
         predicted_label_id: Integer class index predicted by the classifier.

     Returns:
         bool: True when 0 <= predicted_label_id <= 397, otherwise False.
     """
     # An upper bound of 398 would let the first non-animal class through.
     last_animal_class_id = 397
     return 0 <= predicted_label_id <= last_animal_class_id
 # Function to create the chat engine.
 @st.cache_resource
 def create_chat_engine(img_desc, api_key):
     doc = Document(text=img_desc)
-    chat_engine = index.as_chat_engine(
-        chat_mode="react",
-        verbose=True,
-        memory=chatmemory
     )
-    return chat_engine
 # Clear chat function
 def clear_chat():
     if "messages" in st.session_state:
@@ -149,7 +159,7 @@ else:
     col1, col2, col3 = st.columns([1, 2, 1])
     with col2:  # Camera input will be in the middle column
-        camera_image = st.camera_input("Take a picture")
     # Determine the source of the image (upload or camera)
@@ -162,17 +172,20 @@ else:
     if image_data:
         # Display the uploaded image at a standard width.
         st.image(image_data, caption='Uploaded Image.', width=200)
         # Process the uploaded image to get a caption.
         img_desc, label_id = get_image_caption(image_data)
         if not (is_animal(label_id)):
             st.error("Please upload image of an animal!")
             st.stop()
         # Initialize the chat engine with the image description.
-        chat_engine = create_chat_engine(img_desc, st.secrets['GOOGLE_API_KEY'])
         st.write("Image Uploaded Successfully. Ask me anything about it.")
@@ -182,8 +195,9 @@ else:
     # Display previous messages
     for message in st.session_state.messages:
-        with st.chat_message(message["role"]):
-            st.markdown(message["content"])
     # Handle new user input
     user_input = st.chat_input("Ask me about the image:", key="chat_input")
@@ -193,27 +207,38 @@ else:
         # Display user message immediately
         with st.chat_message("user"):
-            st.markdown(user_input)
         # Call the chat engine to get the response if an image has been uploaded
         if image_data and user_input:
             try:
                 with st.spinner('Waiting for the chat engine to respond...'):
                     # Get the response from your chat engine
-                    response = chat_engine.chat(f"""You are a chatbot that roleplays as an animal and also makes animal sounds when chatting.
-                    You always answer in great detail and are polite. Your responses always descriptive.
-                    Your job is to rolelpay as the animal that is mentioned in the image the user has uploaded. Image description: {img_desc}. User question
-                    {user_input}""")
                 # Append assistant message to the session state
-                st.session_state.messages.append({"role": "assistant", "content": response})
                 # Display the assistant message
                 with st.chat_message("assistant"):
-                    st.markdown(response)
             except Exception as e:
                 st.error(f'An error occurred.')
             # Increment the message count and update the cookie
             message_count += 1

 from llama_index.memory import ChatMemoryBuffer
 import os
 import datetime
+from llama_index.llms import Cohere
+from llama_index.query_engine import CitationQueryEngine
 #imports for resnet
 from transformers import AutoFeatureExtractor, ResNetForImageClassification
 cookie_manager = stx.CookieManager()
 #Function to init resnet
+@st.cache_resource(show_spinner="Initializing ResNet model for image classification. Please wait...")
 def load_model_and_labels():
     # Load animal labels as a dictionary
     animal_labels_dict = {}
     return predicted_label_name, predicted_label_id
+@st.cache_resource(show_spinner="Initializing LLM and setting up service context. Please wait...")
 def init_llm(api_key):
+#    llm = PaLM(api_key=api_key)
+    llm = Cohere(model="command", api_key=st.secrets['COHERE_API_TOKEN'])
     service_context = ServiceContext.from_defaults(llm=llm, embed_model="local")
     storage_context = StorageContext.from_defaults(persist_dir="storage")
     return llm, service_context, storage_context, index, chatmemory
+llm, service_context, storage_context, index, chatmemory = init_llm(os.environ["GOOGLE_API_KEY"])
 def is_animal(predicted_label_id):
     """Return True if the predicted class ID falls in the animal range.

     Assumes the classifier emits standard ImageNet-1k class indices, in
     which the animal classes occupy 0-397 and index 398 is "abacus".
     NOTE(review): confirm against the label file used by the classifier.

     Args:
         predicted_label_id: Integer class index predicted by the classifier.

     Returns:
         bool: True when 0 <= predicted_label_id <= 397, otherwise False.
     """
     # An upper bound of 398 would let the first non-animal class through.
     last_animal_class_id = 397
     return 0 <= predicted_label_id <= last_animal_class_id
 # Function to create the chat engine.
 @st.cache_resource
 def create_chat_engine(img_desc, api_key):
+    #llm = PaLM(api_key=api_key)
+    #service_context = ServiceContext.from_defaults(llm=llm,embed_model="local")
     doc = Document(text=img_desc)
+    # Now is_animal is a boolean indicating whether the image is of an animal
+    print("Is the image of an animal:", is_animal)
+    query_engine = CitationQueryEngine.from_args(
+        index,
+        similarity_top_k=3,
+        # here we can control how granular citation sources are, the default is 512
+        citation_chunk_size=512,
+        verbose=True
     )
+    return query_engine
 # Clear chat function
 def clear_chat():
     if "messages" in st.session_state:
     col1, col2, col3 = st.columns([1, 2, 1])
     with col2:  # Camera input will be in the middle column
+        camera_image = st.camera_input("Take a picture", on_change=on_image_upload)
     # Determine the source of the image (upload or camera)
     if image_data:
         # Display the uploaded image at a standard width.
+        st.session_state['assistant_avatar'] = image_data
         st.image(image_data, caption='Uploaded Image.', width=200)
         # Process the uploaded image to get a caption.
+        #img_desc = get_image_caption(image_data)
         img_desc, label_id = get_image_caption(image_data)
         if not (is_animal(label_id)):
+            #st.error("Please upload image of an animal!")
             st.error("Please upload image of an animal!")
             st.stop()
         # Initialize the chat engine with the image description.
+        chat_engine = create_chat_engine(img_desc, os.environ["GOOGLE_API_KEY"])
         st.write("Image Uploaded Successfully. Ask me anything about it.")
     # Display previous messages
     for message in st.session_state.messages:
+        avatar = st.session_state['assistant_avatar'] if message["role"] == "assistant" else None
+        with st.chat_message(message["role"], avatar = avatar):
+            st.write(message["content"])
     # Handle new user input
     user_input = st.chat_input("Ask me about the image:", key="chat_input")
         # Display user message immediately
         with st.chat_message("user"):
+            st.write(user_input)
         # Call the chat engine to get the response if an image has been uploaded
         if image_data and user_input:
             try:
                 with st.spinner('Waiting for the chat engine to respond...'):
                     # Get the response from your chat engine
+                    system_prompt=f"""
+                    You are a chatbot, able to have normal interactions. Do not make up information.
+                    You always answer in great detail and are polite. Your job is to roleplay as an {img_desc}.
+                    Remember to make {img_desc} sounds while talking but dont overdo it.
+                    """
+                    response = chat_engine.query(f"{system_prompt}. {user_input}")
+                    #response = chat_engine.chat(f"""You are a chatbot that roleplays as an animal and also makes animal sounds when chatting.
+                    #You always answer in great detail and are polite. Your responses always descriptive.
+                    #Your job is to rolelpay as the animal that is mentioned in the image the user has uploaded. Image description: {img_desc}. User question
+                    #{user_input}""")
                 # Append assistant message to the session state
+                st.session_state.messages.append({"role": "assistant", "content": response.response})
                 # Display the assistant message
                 with st.chat_message("assistant"):
+                    st.write(response.response)
+                    st.expander("hello")
             except Exception as e:
                 st.error(f'An error occurred.')
+                # Optionally, you can choose to break the flow here if a critical error happens
+                # return
             # Increment the message count and update the cookie
             message_count += 1