xaman4

Running

App Files Community

salomonsky committed on Jan 20, 2024

Commit

b39afbd

verified ·

1 Parent(s): 8438d4f

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -20

app.py CHANGED Viewed

@@ -15,6 +15,7 @@ def recognize_speech(audio_data, show_messages=True):
     audio_recording = sr.AudioFile(audio_data)
     with audio_recording as source:
         audio = recognizer.record(source)
     try:
@@ -24,7 +25,7 @@ def recognize_speech(audio_data, show_messages=True):
             st.write(audio_text)
             st.success("Reconocimiento de voz completado.")
     except sr.UnknownValueError:
-        st.warning("No se pudo reconocer el audio.")
         audio_text = ""
     except sr.RequestError:
         st.error("Hablame para comenzar!")
@@ -82,25 +83,17 @@ def text_to_speech(text, speed=1.3):
     modified_audio_fp.seek(0)
     return modified_audio_fp
-def main():
-    st.title("Chatbot de Voz a Voz")
-    microphones = sr.Microphone.list_microphone_names()
-    if microphones:
-        selected_microphone_index = 0
-        audio_data = sr.Microphone(device_index=selected_microphone_index)
-    else:
-        st.warning("No se encontraron dispositivos.")
-    if not audio_data.empty():
-        st.audio(audio_data.export().read(), format="audio/wav")
-        audio_data.export("audio.wav", format="wav")
-        audio_text = recognize_speech("audio.wav")
-        if audio_text:
-            output, audio_file = generate(audio_text, history=st.session_state.history)
-            if audio_text:
-                st.session_state.history.append((audio_text, output))
             if audio_file is not None:
                 st.markdown(
@@ -110,5 +103,23 @@ def main():
                     unsafe_allow_html=True
                 )
 if __name__ == "__main__":
-    main()

     audio_recording = sr.AudioFile(audio_data)
     with audio_recording as source:
+        recognizer.adjust_for_ambient_noise(source)  # Ajuste para el ruido ambiente
         audio = recognizer.record(source)
     try:
             st.write(audio_text)
             st.success("Reconocimiento de voz completado.")
     except sr.UnknownValueError:
+        st.warning("No se pudo reconocer el audio. ¿Intentaste grabar algo?")
         audio_text = ""
     except sr.RequestError:
         st.error("Hablame para comenzar!")
     modified_audio_fp.seek(0)
     return modified_audio_fp
+def background_listener(recognizer, source):
+    while True:
+        try:
+            audio_text = recognizer.recognize_google(recognizer.listen(source), language="es-ES")
+            st.subheader("Texto Reconocido:")
+            st.write(audio_text)
+            st.success("Reconocimiento de voz completado.")
+            output, audio_file = generate(audio_text, history=st.session_state.history)
+            if audio_text:
+                st.session_state.history.append((audio_text, output))
             if audio_file is not None:
                 st.markdown(
                     unsafe_allow_html=True
                 )
+        except sr.UnknownValueError:
+            pass  # Ignore if nothing is recognized
+        except sr.RequestError:
+            st.error("Error de solicitud. Asegúrate de tener una conexión a Internet.")
+def main():
+    st.title("Chatbot de Voz a Voz")
+    recognizer = sr.Recognizer()
+    microphone = sr.Microphone()
+    with microphone as source:
+        recognizer.adjust_for_ambient_noise(source)  # Ajuste inicial para el ruido ambiente
+    st.warning("Escuchando en segundo plano. Puedes hablar en cualquier momento.")
+    stop_listening = recognizer.listen_in_background(microphone, background_listener)
+    st.button("Detener Escucha", on_click=stop_listening)
 if __name__ == "__main__":
+    main()