Spaces:

eaysu
/

Voice-Cloning-Multilingual

Runtime error

App Files Files Community

eaysu committed on 21 days ago

Commit

1445567

1 Parent(s): 94306c5

initial commit

Browse files

Files changed (3) hide show

.DS_Store +0 -0
app.py +59 -0
requirements.txt +4 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

app.py ADDED Viewed

	@@ -0,0 +1,59 @@

+import torch
+from TTS.api import TTS
+import gradio as gr
+import soundfile as sf
+import numpy as np
+# Get device
+device = "cuda" if torch.cuda.is_available() else "cpu"
+# Initialize TTS model
+tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
+# Define available languages
+AVAILABLE_LANGUAGES = ["en", "de", "fr", "it", "es", "tr"]
+# Function to generate cloned voice
+def clone_voice(text, language, speaker_wav):
+    # Ensure the language is supported
+    if language not in AVAILABLE_LANGUAGES:
+        raise ValueError(f"Language '{language}' is not supported. Available languages: {AVAILABLE_LANGUAGES}")
+    # Generate speech
+    wav = tts.tts(text=text, speaker_wav=speaker_wav, language=language)
+    # Save the output to a temporary file
+    output_file = "output.wav"
+    sf.write(output_file, wav, 22050)
+    return output_file
+# Gradio interface
+def gradio_interface(text, language, speaker_wav):
+    try:
+        output_file = clone_voice(text, language, speaker_wav)
+        return output_file
+    except Exception as e:
+        return str(e)
+# Define Gradio inputs and outputs
+inputs = [
+    gr.Textbox(label="Text to speak", placeholder="Enter text here..."),
+    gr.Dropdown(label="Language", choices=AVAILABLE_LANGUAGES, value="en"),
+    gr.Audio(label="Reference Voice (Upload or Record)", type="filepath"),
+]
+outputs = gr.Audio(label="Cloned Voice Output")
+# Create Gradio interface
+interface = gr.Interface(
+    fn=gradio_interface,
+    inputs=inputs,
+    outputs=outputs,
+    title="Voice Cloning with Coqui TTS",
+    description="Upload or record a reference voice, enter text, and select a language to generate a cloned voice.",
+    live=False,
+)
+# Launch the interface
+interface.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+torch
+TTS
+gradio
+soundfile