IT2091024v2

Paused

Pijush2023 committed on Aug 29, 2024

Commit

3791d11

verified ·

1 Parent(s): 5feca2f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,20 +1,3 @@
-import subprocess
-import sys
-# Install the PortAudio library
-try:
-    subprocess.run(["apt-get", "install", "-y", "portaudio19-dev"], check=True)
-except subprocess.CalledProcessError as e:
-    print(f"Error occurred while installing PortAudio: {e}")
-    sys.exit(1)
-# Now import sounddevice
-try:
-    import sounddevice as sd
-except OSError as e:
-    print(f"Failed to import sounddevice: {e}")
-    sys.exit(1)
 import gradio as gr
 import requests
 import os
@@ -806,14 +789,18 @@ def generate_audio_parler_tts(text):
         for new_audio in streamer:
             if new_audio.shape[0] == 0:
                 break
-            # Real-time playback of the audio chunk
-            sd.play(new_audio, samplerate=sampling_rate)
-            sd.wait()  # Wait until the audio is played before moving to the next chunk
             yield sampling_rate, new_audio
     audio_segments = []
     for (sampling_rate, audio_chunk) in generate(text, description, chunk_size_in_s):
         audio_segments.append(audio_chunk)
     # Combine all the audio chunks into one audio file
     combined_audio = np.concatenate(audio_segments)
@@ -821,7 +808,7 @@ def generate_audio_parler_tts(text):
     write_wav(combined_audio_path, sampling_rate, combined_audio.astype(np.float32))
-    logging.debug(f"Audio saved to {combined_audio_path}")
     return combined_audio_path

 import gradio as gr
 import requests
 import os
         for new_audio in streamer:
             if new_audio.shape[0] == 0:
                 break
+            # Save or process each audio chunk as it is generated
             yield sampling_rate, new_audio
     audio_segments = []
     for (sampling_rate, audio_chunk) in generate(text, description, chunk_size_in_s):
         audio_segments.append(audio_chunk)
+        # Here, you can save the chunk to a file or send it to a frontend
+        # For example, you could write the chunk to a file immediately:
+        temp_audio_path = os.path.join(tempfile.gettempdir(), f"parler_tts_audio_chunk_{len(audio_segments)}.wav")
+        write_wav(temp_audio_path, sampling_rate, audio_chunk.astype(np.float32))
+        logging.debug(f"Saved chunk to {temp_audio_path}")
+        # You could also send the chunk to a web client if this was a web application
     # Combine all the audio chunks into one audio file
     combined_audio = np.concatenate(audio_segments)
     write_wav(combined_audio_path, sampling_rate, combined_audio.astype(np.float32))
+    logging.debug(f"Combined audio saved to {combined_audio_path}")
     return combined_audio_path