ollieollie's picture
update app.py
c30668f
raw
history blame
855 Bytes
from orator.src.orator.tts import OratorTTS
import gradio as gr
model = OratorTTS.from_pretrained("cuda")
def generate(text, audio_prompt_path, exaggeration, pace, temperature):
wav = model.generate(
text, audio_prompt_path=audio_prompt_path,
exaggeration=exaggeration,
pace=pace,
temperature=temperature,
)
return 24000, wav.squeeze(0).numpy()
demo = gr.Interface(
generate,
[
gr.Textbox(value="", label="Text to synthesize"),
gr.Audio(sources="upload", type="filepath", label="Reference Audio File", value=None),
gr.Slider(-5, 5, step=.05, label="exaggeration", value=.5),
gr.Slider(0.8, 1.2, step=.01, label="pace", value=1),
gr.Slider(0.05, 5, step=.05, label="temperature", value=.8),
],
"audio",
)
if __name__ == "__main__":
demo.launch()