xaman4

Sleeping

App Files Community

salomonsky committed on Jan 13, 2024

Commit

d843813

verified ·

1 Parent(s): b0b5cd6

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -55

app.py CHANGED Viewed

@@ -1,11 +1,7 @@
 import streamlit as st
-from huggingface_hub import InferenceClient
-from gtts import gTTS
-import base64
 import speech_recognition as sr
 from pydub import AudioSegment
 from pydub.playback import play
-import pyaudio
 from io import BytesIO
 from time import sleep
@@ -62,7 +58,6 @@ def generate_with_progress(
         response += response_token.token.text
         total_tokens += 1
-        # Actualizar la barra de progreso
         st.subheader("Generando respuesta...")
         st.progress(total_tokens / max_new_tokens)
@@ -70,56 +65,37 @@ def generate_with_progress(
     return response
-# Configuración para la entrada de voz
-with st.form("voice_input_form"):
-    st.write("Haz clic en el botón para iniciar la grabación de voz:")
-    start_recording_button = st.form_submit_button("Iniciar Grabación")
-# Inicializar historial si no existe
 if "history" not in st.session_state:
     st.session_state.history = []
-# Verificar si se hace clic en el botón de grabación
-if start_recording_button:
-    st.info("Habla ahora...")
-    audio_data = BytesIO()
-    p = pyaudio.PyAudio()
-    stream = p.open(format=pyaudio.paInt16, channels=1, rate=44100, input=True, frames_per_buffer=1024)
-    with st.spinner("Grabando..."):
-        frames = []
-        for i in range(int(44100 / 1024 * 5)):  # grabar durante 5 segundos
-            data = stream.read(1024)
-            frames.append(data)
-    stream.stop_stream()
-    stream.close()
-    p.terminate()
-    recognizer = sr.Recognizer()
-    try:
-        audio_data.write(b''.join(frames))
-        audio_data.seek(0)
-        audio = AudioSegment.from_file(audio_data, format="wav")
-        text = recognizer.recognize_google(audio, language="es-ES")
-        st.success(f"Texto reconocido: {text}")
-        generate_progress = st.empty()
-        generate_progress.progress(0.0)
-        output = generate_with_progress(text, history=st.session_state.history)
-        st.session_state.history.append((text, output))
-        st.success("Respuesta generada con éxito.")
-        st.subheader("Reproduciendo respuesta...")
-        audio_file_path = text_to_speech(output)
-        play(audio_file_path)
-        for progress_value in range(0, 101, 10):
-            st.progress(progress_value / 100)
-            sleep(0.5)
-    except sr.UnknownValueError:
-        st.warning("No se pudo reconocer el habla.")
-    except sr.RequestError as e:
-        st.error(f"Error en la solicitud al servicio de reconocimiento de voz: {e}")

 import streamlit as st
 import speech_recognition as sr
 from pydub import AudioSegment
 from pydub.playback import play
 from io import BytesIO
 from time import sleep
         response += response_token.token.text
         total_tokens += 1
         st.subheader("Generando respuesta...")
         st.progress(total_tokens / max_new_tokens)
     return response
 if "history" not in st.session_state:
     st.session_state.history = []
+recognizer = sr.Recognizer()
+while True:
+    with st.spinner("Escuchando..."):
+        try:
+            with sr.Microphone() as source:
+                audio_data = recognizer.listen(source, timeout=5)
+            st.success("Audio capturado con éxito.")
+            text = recognizer.recognize_google(audio_data, language="es-ES")
+            st.success(f"Texto reconocido: {text}")
+            st.subheader("Generando respuesta...")
+            st.progress(0.0)
+            output = generate_with_progress(text, history=st.session_state.history)
+            st.session_state.history.append((text, output))
+            st.success("Respuesta generada con éxito.")
+            st.subheader("Reproduciendo respuesta...")
+            audio_file_path = text_to_speech(output)
+            play(audio_file_path)
+            for progress_value in range(0, 101, 10):
+                st.progress(progress_value / 100)
+                sleep(0.5)
+        except sr.UnknownValueError:
+            st.warning("No se pudo reconocer el habla.")
+        except sr.RequestError as e:
+            st.error(f"Error en la solicitud al servicio de reconocimiento de voz: {e}")
+            break