Spaces:

Bhaskar2611
/

Capstone

Paused

App Files Files Community

Bhaskar2611 committed on Oct 9, 2024

Commit

edb8de4

verified ·

1 Parent(s): a66fbb9

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -8

app.py CHANGED Viewed

@@ -67,6 +67,7 @@ from huggingface_hub import InferenceClient
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 def respond(
     message,
     history: list[tuple[str, str]],
@@ -76,18 +77,22 @@ def respond(
     top_p,
 ):
     try:
         messages = [{"role": "system", "content": system_message}]
-        for val in history:
-            if val[0]:
-                messages.append({"role": "user", "content": val[0]})
-            if val[1]:
-                messages.append({"role": "assistant", "content": val[1]})
         messages.append({"role": "user", "content": message})
         response = ""
         for message in client.chat_completion(
             messages,
             max_tokens=max_tokens,
@@ -98,10 +103,12 @@ def respond(
             token = message.choices[0].delta.content
             response += token
             yield response
-    except Exception as e:
-        # Catching any errors and displaying a fallback message instead
-        yield "Sorry, something went wrong. Please try again."
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
@@ -116,7 +123,11 @@ demo = gr.ChatInterface(
             label="Top-p (nucleus sampling)",
         ),
     ],
 )
 if __name__ == "__main__":
     demo.launch()

 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
+# Function to respond to user input while maintaining chat history
 def respond(
     message,
     history: list[tuple[str, str]],
     top_p,
 ):
     try:
+        # Append system message at the start
         messages = [{"role": "system", "content": system_message}]
+        # Append the chat history
+        for user_msg, bot_reply in history:
+            if user_msg:
+                messages.append({"role": "user", "content": user_msg})
+            if bot_reply:
+                messages.append({"role": "assistant", "content": bot_reply})
+        # Add the latest user message
         messages.append({"role": "user", "content": message})
         response = ""
+        # Stream the response token by token to avoid loading delays
         for message in client.chat_completion(
             messages,
             max_tokens=max_tokens,
             token = message.choices[0].delta.content
             response += token
             yield response
+    except Exception:
+        # Suppress any error and maintain conversation without showing error icon or message
+        yield "Error handled silently."  # You can replace this with "" to hide any message
+# Gradio interface with preserved history and customizable chatbot behavior
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
             label="Top-p (nucleus sampling)",
         ),
     ],
+    # Enable to retain history and suppress errors
+    retain_history=True,  # This will ensure the chat history is not lost between interactions
+    retry_on_error=False  # Prevent showing the error message or retry button
 )
 if __name__ == "__main__":
     demo.launch()