mistral-super-fast

Sleeping

App Files Files Community

wop committed on Feb 29

Commit

b35606a

•

1 Parent(s): 44b3bcb

Update app.py (#1)

Browse files

- Update app.py (52d69de8d339328ef19de7ed98bf3787ed107748)

Files changed (1) hide show

app.py +9 -26

app.py CHANGED Viewed

@@ -1,26 +1,21 @@
 import json
-from huggingface_hub import InferenceClient
 import gradio as gr
 import random
 API_URL = "https://api-inference.huggingface.co/models/"
-client = InferenceClient(
-    "mistralai/Mistral-7B-Instruct-v0.1"
-)
 def format_prompt(message, history):
     prompt = "You're a helpful assistant."
     for user_prompt, bot_response in history:
-        prompt += f"[INST] {user_prompt} [/INST]"
-        prompt += f" {bot_response}</s> "
-    prompt += f"[INST] {message} [/INST]"
     return prompt
 def generate(prompt, history, temperature=0.9, max_new_tokens=2048, top_p=0.95, repetition_penalty=1.0):
-    temperature = float(temperature)
-    if temperature < 1e-2:
-        temperature = 1e-2
     top_p = float(top_p)
     generate_kwargs = dict(
@@ -40,47 +35,35 @@ def generate(prompt, history, temperature=0.9, max_new_tokens=2048, top_p=0.95,
     for response in stream:
         output += response.token.text
         yield output
-    return output
 def load_database():
     try:
-        # Attempt to load the database from JSON
         with open("database.json", "r", encoding="utf-8") as f:
             return json.load(f)
     except (FileNotFoundError, json.JSONDecodeError):
-        # Handle potential errors gracefully
         print("Error loading database: File not found or invalid format. Creating an empty database.")
-        return []  # Return an empty list if database loading fails
 def save_database(data):
     try:
-        # Save the updated database to JSON
         with open("database.json", "w", encoding="utf-8") as f:
             json.dump(data, f, indent=4)
     except (IOError, json.JSONEncodeError):
-        # Handle potential errors gracefully
         print("Error saving database: Encountered an issue while saving.")
 def chat_interface(message):
     database = load_database()
-    # Check if the question already exists in the database
     if (message, None) not in database:
-        # If not, generate a response and add it to the database
-        response = generate(message, history=[])
         database.append((message, response))
         save_database(database)
     else:
-        # If it does, retrieve the stored response
         _, stored_response = next(item for item in database if item[0] == message)
         response = stored_response
     return response
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    # Use "Textbox" components for both input and output
-    input_textbox = gr.Textbox(label="Your question")
-    output_textbox = gr.Textbox(label="Assistant's response", value="", editable=False)
-    # Use demo.launch instead of demo.queue().launch()
-    demo.launch(fn=chat_interface, inputs=input_textbox, outputs=output_textbox)

 import json
 import gradio as gr
 import random
+from huggingface_hub import InferenceClient
 API_URL = "https://api-inference.huggingface.co/models/"
+client = InferenceClient("mistralai/Mistral-7B-Instruct-v0.1")
 def format_prompt(message, history):
     prompt = "You're a helpful assistant."
     for user_prompt, bot_response in history:
+        prompt += f" [INST] {user_prompt} [/INST] {bot_response}</s> "
+    prompt += f" [INST] {message} [/INST]"
     return prompt
 def generate(prompt, history, temperature=0.9, max_new_tokens=2048, top_p=0.95, repetition_penalty=1.0):
+    temperature = float(temperature) if temperature > 0 else 0.01
     top_p = float(top_p)
     generate_kwargs = dict(
     for response in stream:
         output += response.token.text
         yield output
 def load_database():
     try:
         with open("database.json", "r", encoding="utf-8") as f:
             return json.load(f)
     except (FileNotFoundError, json.JSONDecodeError):
         print("Error loading database: File not found or invalid format. Creating an empty database.")
+        return []
 def save_database(data):
     try:
         with open("database.json", "w", encoding="utf-8") as f:
             json.dump(data, f, indent=4)
     except (IOError, json.JSONEncodeError):
         print("Error saving database: Encountered an issue while saving.")
 def chat_interface(message):
     database = load_database()
     if (message, None) not in database:
+        response = next(generate(message, history=[]))
         database.append((message, response))
         save_database(database)
     else:
         _, stored_response = next(item for item in database if item[0] == message)
         response = stored_response
     return response
+with gr.Interface(fn=chat_interface, inputs="textbox", outputs="textbox", title="Chat Interface") as iface:
+    iface.launch()