Gemini

Sleeping

App Files Files Community

tedslin committed on Jan 2

Commit

ca02256

•

1 Parent(s): 264871b

Update app.py

Browse files

Files changed (1) hide show

app.py +96 -38

app.py CHANGED Viewed

@@ -24,10 +24,7 @@ DUPLICATE = """
 </div>
 """
-AVATAR_IMAGES = (
-    None,
-    "https://media.roboflow.com/spaces/gemini-icon.png"
-)
 IMAGE_CACHE_DIRECTORY = "/tmp"
 IMAGE_WIDTH = 512
@@ -54,22 +51,22 @@ def cache_pil_image(image: Image.Image) -> str:
 def preprocess_chat_history(
-    history: CHAT_HISTORY
 ) -> List[Dict[str, Union[str, List[str]]]]:
     messages = []
     for user_message, model_message in history:
         if isinstance(user_message, tuple):
             pass
         elif user_message is not None:
-            messages.append({'role': 'user', 'parts': [user_message]})
         if model_message is not None:
-            messages.append({'role': 'model', 'parts': [model_message]})
     return messages
 def upload(files: Optional[List[str]], chatbot: CHAT_HISTORY) -> CHAT_HISTORY:
     for file in files:
-        image = Image.open(file).convert('RGB')
         image = preprocess_image(image)
         image_path = cache_pil_image(image)
         chatbot.append(((image_path,), None))
@@ -90,7 +87,9 @@ def bot(
     stop_sequences: str,
     top_k: int,
     top_p: float,
-    chatbot: CHAT_HISTORY
 ):
     if len(chatbot) == 0:
         return chatbot
@@ -99,7 +98,12 @@ def bot(
     if not google_key:
         raise ValueError(
             "GOOGLE_API_KEY is not set. "
-            "Please follow the instructions in the README to set it up.")
     genai.configure(api_key=google_key)
     generation_config = genai.types.GenerationConfig(
@@ -107,31 +111,38 @@ def bot(
         max_output_tokens=max_output_tokens,
         stop_sequences=preprocess_stop_sequences(stop_sequences=stop_sequences),
         top_k=top_k,
-        top_p=top_p)
     if files:
-        text_prompt = [chatbot[-1][0]] \
-            if chatbot[-1][0] and isinstance(chatbot[-1][0], str) \
             else []
-        image_prompt = [Image.open(file).convert('RGB') for file in files]
-        model = genai.GenerativeModel('gemini-pro-vision')
         response = model.generate_content(
             text_prompt + image_prompt,
             stream=True,
-            generation_config=generation_config)
     else:
         messages = preprocess_chat_history(chatbot)
-        model = genai.GenerativeModel('gemini-pro')
         response = model.generate_content(
             messages,
             stream=True,
-            generation_config=generation_config)
     # streaming effect
     chatbot[-1][1] = ""
     for chunk in response:
         for i in range(0, len(chunk.text), 10):
-            section = chunk.text[i:i + 10]
             chatbot[-1][1] += section
             time.sleep(0.01)
             yield chatbot
@@ -143,18 +154,19 @@ google_key_component = gr.Textbox(
     type="password",
     placeholder="...",
     info="You have to provide your own GOOGLE_API_KEY for this app to function properly",
-    visible=GOOGLE_API_KEY is None
 )
 chatbot_component = gr.Chatbot(
-    label='Gemini',
     bubble_full_width=False,
     avatar_images=AVATAR_IMAGES,
     scale=2,
-    height=400
 )
 text_prompt_component = gr.Textbox(
     placeholder="Hi there! [press Enter]", show_label=False, autofocus=True, scale=8
 )
 upload_button_component = gr.UploadButton(
     label="Upload Images", file_count="multiple", file_types=["image"], scale=1
 )
@@ -169,7 +181,8 @@ temperature_component = gr.Slider(
         "Temperature controls the degree of randomness in token selection. Lower "
         "temperatures are good for prompts that expect a true or correct response, "
         "while higher temperatures can lead to more diverse or unexpected results. "
-    ))
 max_output_tokens_component = gr.Slider(
     minimum=1,
     maximum=2048,
@@ -178,8 +191,9 @@ max_output_tokens_component = gr.Slider(
     label="Token limit",
     info=(
         "Token limit determines the maximum amount of text output from one prompt. A "
-        "token is approximately four characters. The default value is 2048."
-    ))
 stop_sequences_component = gr.Textbox(
     label="Add stop sequence",
     value="",
@@ -189,7 +203,8 @@ stop_sequences_component = gr.Textbox(
         "A stop sequence is a series of characters (including spaces) that stops "
         "response generation if the model encounters it. The sequence is not included "
         "as part of the response. You can add up to five stop sequences."
-    ))
 top_k_component = gr.Slider(
     minimum=1,
     maximum=40,
@@ -202,7 +217,8 @@ top_k_component = gr.Slider(
         "vocabulary (also called greedy decoding), while a top-k of 3 means that the "
         "next token is selected from among the 3 most probable tokens (using "
         "temperature)."
-    ))
 top_p_component = gr.Slider(
     minimum=0,
     maximum=1,
@@ -215,12 +231,44 @@ top_p_component = gr.Slider(
         "top-p value. For example, if tokens A, B, and C have a probability of .3, .2, "
         "and .1 and the top-p value is .5, then the model will select either A or B as "
         "the next token (using temperature). "
-    ))
-user_inputs = [
-    text_prompt_component,
-    chatbot_component
-]
 bot_inputs = [
     google_key_component,
@@ -230,7 +278,9 @@ bot_inputs = [
     stop_sequences_component,
     top_k_component,
     top_p_component,
-    chatbot_component
 ]
 with gr.Blocks() as demo:
@@ -242,12 +292,16 @@ with gr.Blocks() as demo:
         chatbot_component.render()
         with gr.Row():
             text_prompt_component.render()
             upload_button_component.render()
             run_button_component.render()
         with gr.Accordion("Parameters", open=False):
             temperature_component.render()
             max_output_tokens_component.render()
             stop_sequences_component.render()
             with gr.Accordion("Advanced", open=False):
                 top_k_component.render()
                 top_p_component.render()
@@ -256,25 +310,29 @@ with gr.Blocks() as demo:
         fn=user,
         inputs=user_inputs,
         outputs=[text_prompt_component, chatbot_component],
-        queue=False
     ).then(
-        fn=bot, inputs=bot_inputs, outputs=[chatbot_component],
     )
     text_prompt_component.submit(
         fn=user,
         inputs=user_inputs,
         outputs=[text_prompt_component, chatbot_component],
-        queue=False
     ).then(
-        fn=bot, inputs=bot_inputs, outputs=[chatbot_component],
     )
     upload_button_component.upload(
         fn=upload,
         inputs=[upload_button_component, chatbot_component],
         outputs=[chatbot_component],
-        queue=False
     )
 demo.queue(max_size=99).launch(debug=False, show_error=True)

 </div>
 """
+AVATAR_IMAGES = (None, "https://media.roboflow.com/spaces/gemini-icon.png")
 IMAGE_CACHE_DIRECTORY = "/tmp"
 IMAGE_WIDTH = 512
 def preprocess_chat_history(
+    history: CHAT_HISTORY,
 ) -> List[Dict[str, Union[str, List[str]]]]:
     messages = []
     for user_message, model_message in history:
         if isinstance(user_message, tuple):
             pass
         elif user_message is not None:
+            messages.append({"role": "user", "parts": [user_message]})
         if model_message is not None:
+            messages.append({"role": "model", "parts": [model_message]})
     return messages
 def upload(files: Optional[List[str]], chatbot: CHAT_HISTORY) -> CHAT_HISTORY:
     for file in files:
+        image = Image.open(file).convert("RGB")
         image = preprocess_image(image)
         image_path = cache_pil_image(image)
         chatbot.append(((image_path,), None))
     stop_sequences: str,
     top_k: int,
     top_p: float,
+    categories: Optional[List[str]],
+    threshold: str,
+    chatbot: CHAT_HISTORY,
 ):
     if len(chatbot) == 0:
         return chatbot
     if not google_key:
         raise ValueError(
             "GOOGLE_API_KEY is not set. "
+            "Please follow the instructions in the README to set it up."
+        )
+    safety_settings = []
+    for category in categories:
+        safety_settings.append({"category": category, "threshold": threshold})
     genai.configure(api_key=google_key)
     generation_config = genai.types.GenerationConfig(
         max_output_tokens=max_output_tokens,
         stop_sequences=preprocess_stop_sequences(stop_sequences=stop_sequences),
         top_k=top_k,
+        top_p=top_p,
+    )
     if files:
+        text_prompt = (
+            [chatbot[-1][0]]
+            if chatbot[-1][0] and isinstance(chatbot[-1][0], str)
             else []
+        )
+        image_prompt = [Image.open(file).convert("RGB") for file in files]
+        model = genai.GenerativeModel("gemini-pro-vision")
         response = model.generate_content(
             text_prompt + image_prompt,
             stream=True,
+            generation_config=generation_config,
+            safety_settings=safety_settings,
+        )
     else:
         messages = preprocess_chat_history(chatbot)
+        model = genai.GenerativeModel("gemini-pro")
         response = model.generate_content(
             messages,
             stream=True,
+            generation_config=generation_config,
+            safety_settings=safety_settings,
+        )
     # streaming effect
     chatbot[-1][1] = ""
     for chunk in response:
         for i in range(0, len(chunk.text), 10):
+            section = chunk.text[i : i + 10]
             chatbot[-1][1] += section
             time.sleep(0.01)
             yield chatbot
     type="password",
     placeholder="...",
     info="You have to provide your own GOOGLE_API_KEY for this app to function properly",
+    visible=GOOGLE_API_KEY is None,
 )
 chatbot_component = gr.Chatbot(
+    label="Gemini",
     bubble_full_width=False,
     avatar_images=AVATAR_IMAGES,
     scale=2,
+    height=400,
 )
 text_prompt_component = gr.Textbox(
     placeholder="Hi there! [press Enter]", show_label=False, autofocus=True, scale=8
 )
 upload_button_component = gr.UploadButton(
     label="Upload Images", file_count="multiple", file_types=["image"], scale=1
 )
         "Temperature controls the degree of randomness in token selection. Lower "
         "temperatures are good for prompts that expect a true or correct response, "
         "while higher temperatures can lead to more diverse or unexpected results. "
+    ),
+)
 max_output_tokens_component = gr.Slider(
     minimum=1,
     maximum=2048,
     label="Token limit",
     info=(
         "Token limit determines the maximum amount of text output from one prompt. A "
+        "token is approximately four characters. The max value is 2048."
+    ),
+)
 stop_sequences_component = gr.Textbox(
     label="Add stop sequence",
     value="",
         "A stop sequence is a series of characters (including spaces) that stops "
         "response generation if the model encounters it. The sequence is not included "
         "as part of the response. You can add up to five stop sequences."
+    ),
+)
 top_k_component = gr.Slider(
     minimum=1,
     maximum=40,
         "vocabulary (also called greedy decoding), while a top-k of 3 means that the "
         "next token is selected from among the 3 most probable tokens (using "
         "temperature)."
+    ),
+)
 top_p_component = gr.Slider(
     minimum=0,
     maximum=1,
         "top-p value. For example, if tokens A, B, and C have a probability of .3, .2, "
         "and .1 and the top-p value is .5, then the model will select either A or B as "
         "the next token (using temperature). "
+    ),
+)
+category_dropdown_component = gr.Dropdown(
+    label="Category",
+    choices=[
+        "HARM_CATEGORY_DANGEROUS",
+        "HARM_CATEGORY_HARASSMENT",
+        "HARM_CATEGORY_HATE_SPEECH",
+        "HARM_CATEGORY_SEXUALLY_EXPLICIT",
+    ],
+    value=[
+        "HARM_CATEGORY_DANGEROUS",
+        "HARM_CATEGORY_HARASSMENT",
+        "HARM_CATEGORY_HATE_SPEECH",
+        "HARM_CATEGORY_SEXUALLY_EXPLICIT",
+    ],
+    info=(
+        "The category of a rating."
+        "These categories cover various kinds of harms that developers may wish to adjust."
+    ),
+    multiselect=True,
+)
+threshold_dropdown_component = gr.Dropdown(
+    label="Threshold",
+    choices=[
+        "BLOCK_LOW_AND_ABOVE",
+        "BLOCK_MEDIUM_AND_ABOVE",
+        "BLOCK_ONLY_HIGH",
+        "BLOCK_NONE",
+    ],
+    value="BLOCK_NONE",
+    info=("Block at and beyond a specified harm probability."),
+)
+user_inputs = [text_prompt_component, chatbot_component]
 bot_inputs = [
     google_key_component,
     stop_sequences_component,
     top_k_component,
     top_p_component,
+    category_dropdown_component,
+    threshold_dropdown_component,
+    chatbot_component,
 ]
 with gr.Blocks() as demo:
         chatbot_component.render()
         with gr.Row():
             text_prompt_component.render()
+            clear_component = gr.ClearButton([text_prompt_component, chatbot_component])
             upload_button_component.render()
             run_button_component.render()
         with gr.Accordion("Parameters", open=False):
             temperature_component.render()
             max_output_tokens_component.render()
             stop_sequences_component.render()
+            with gr.Accordion("Safe Setting", open=False):
+                category_dropdown_component.render()
+                threshold_dropdown_component.render()
             with gr.Accordion("Advanced", open=False):
                 top_k_component.render()
                 top_p_component.render()
         fn=user,
         inputs=user_inputs,
         outputs=[text_prompt_component, chatbot_component],
+        queue=False,
     ).then(
+        fn=bot,
+        inputs=bot_inputs,
+        outputs=[chatbot_component],
     )
     text_prompt_component.submit(
         fn=user,
         inputs=user_inputs,
         outputs=[text_prompt_component, chatbot_component],
+        queue=False,
     ).then(
+        fn=bot,
+        inputs=bot_inputs,
+        outputs=[chatbot_component],
     )
     upload_button_component.upload(
         fn=upload,
         inputs=[upload_button_component, chatbot_component],
         outputs=[chatbot_component],
+        queue=False,
     )
 demo.queue(max_size=99).launch(debug=False, show_error=True)