Spaces:

mgokg
/

gemini-2.0-flash-exp

Running

App Files Files Community

mgokg committed on Jan 14

Commit

0a61873

verified ·

1 Parent(s): 7405511

Update app.py

Browse files

Files changed (1) hide show

app.py +51 -2

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ import os
 import json
 import google.generativeai as genai
 from bs4 import BeautifulSoup
 # Load environment variables
 genai.configure(api_key=os.environ["geminiapikey"])
 read_key = os.environ.get('HF_TOKEN', None)
@@ -20,6 +20,16 @@ custom_css = """
 }
 """
 def predict(prompt):
     generation_config = {
       "temperature": 0.4,
@@ -54,7 +64,43 @@ def websearch(search_term):
     prompt = f"{search_term}\n use this result from a google search to answer the question \n {response_text.text}"
     result = predict(prompt)
     return result
 # Create the Gradio interface
 with gr.Blocks(css=custom_css) as demo:
     with gr.Row():
@@ -69,4 +115,7 @@ with gr.Blocks(css=custom_css) as demo:
     button.click(fn=websearch, inputs=ort_input, outputs=details_output)
 # Launch the Gradio application
-demo.launch()

 import json
 import google.generativeai as genai
 from bs4 import BeautifulSoup
+from groq import Groq
 # Load environment variables
 genai.configure(api_key=os.environ["geminiapikey"])
 read_key = os.environ.get('HF_TOKEN', None)
 }
 """
+api_key = os.getenv('groq_whisper')
+if api_key is None:
+    raise ValueError("groq_whisper environment variable is not set")
+# Initialize the Groq client
+client = Groq(api_key=api_key)
 def predict(prompt):
     generation_config = {
       "temperature": 0.4,
     prompt = f"{search_term}\n use this result from a google search to answer the question \n {response_text.text}"
     result = predict(prompt)
     return result
+def process_audio(file_path):
+    try:
+        # Open the audio file
+        with open(file_path, "rb") as file:
+            # Create a transcription of the audio file
+            translation = client.audio.transcriptions.create(
+                file=(os.path.basename(file_path), file.read()),  # Correct passing of filename
+                model="whisper-large-v3-turbo",  # Required model to use for translation
+                prompt="transcribe",  # Optional
+                language="de",  # Optional
+                response_format="json",  # Optional
+                temperature=0.0  # Optional
+            )
+            # Run a web search on the transcribed text, pass the result to predict(), and return that answer
+            suche = websearch(translation.text)
+            result = predict(suche)
+            return result
+            return translation.text
+    except Exception as e:
+        return f"An error occurred: {str(e)}"
+with gr.Blocks() as speech:
+    with gr.Row():
+        sr_outputs = gr.Textbox(label="Antwort")
+    with gr.Row():
+        sr_inputs = gr.Microphone(type="filepath")
+    sr_inputs.change(process_audio, inputs=sr_inputs, outputs=sr_outputs)
+speech.launch()
+"""
 # Create the Gradio interface
 with gr.Blocks(css=custom_css) as demo:
     with gr.Row():
     button.click(fn=websearch, inputs=ort_input, outputs=details_output)
 # Launch the Gradio application
+demo.launch()
+"""