Spaces:

Tonic
/

whisperspeech

Runtime error

Tonic committed on Jan 29, 2024

Commit

18de3a6

verified ·

1 Parent(s): f7fa40e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -39,9 +39,13 @@ def parse_multilingual_text(input_text):
 @spaces.GPU
 def generate_segment_audio(text, lang, speaker_url, pipe):
     if not isinstance(text, str):
         text = text.decode("utf-8") if isinstance(text, bytes) else str(text)
-    audio_data = pipe.generate(text, speaker_url, lang)
     resample_audio = resampler(newsr=24000)
     audio_data_resampled = next(resample_audio([{'sample_rate': 24000, 'samples': audio_data.cpu()}]))['samples_24k']
     audio_np = audio_data_resampled.cpu().numpy()

 @spaces.GPU
 def generate_segment_audio(text, lang, speaker_url, pipe):
     if not isinstance(text, str):
+        print("Speaker Audio Type:", type(speaker_audio))
+        with open(speaker_audio, 'rb') as file:
+            speaker_audio = file.read()
         text = text.decode("utf-8") if isinstance(text, bytes) else str(text)
+    audio_data = pipe.generate(text, speaker_audio, lang)
     resample_audio = resampler(newsr=24000)
     audio_data_resampled = next(resample_audio([{'sample_rate': 24000, 'samples': audio_data.cpu()}]))['samples_24k']
     audio_np = audio_data_resampled.cpu().numpy()