from orator.src.orator.tts import OratorTTS
import gradio as gr


# Load the pretrained model once at import time; `generate` below reuses this
# single module-level instance for every call.
# NOTE(review): "cuda" is presumably the target device — confirm against
# OratorTTS.from_pretrained.
_DEVICE = "cuda"
model = OratorTTS.from_pretrained(_DEVICE)


def generate(text, audio_prompt_path, emotion_adv):
    """Synthesize speech for *text* using the module-level ``model``.

    Args:
        text: Text to synthesize; passed positionally to ``model.generate``.
        audio_prompt_path: Forwarded to ``model.generate`` as
            ``audio_prompt_path``. The UI supplies it from a file-upload
            audio input configured with ``type="filepath"``.
        emotion_adv: Forwarded to ``model.generate`` as ``emotion_adv``.
            The UI supplies a slider value between 0 and 1.

    Returns:
        A ``(24000, samples)`` tuple, where ``samples`` is the generated
        waveform converted to a NumPy array after squeezing dimension 0.
    """
    wav = model.generate(
        text,
        audio_prompt_path=audio_prompt_path,
        emotion_adv=emotion_adv,
    )
    # The model is created with "cuda", so the result may live on the GPU
    # and/or be attached to an autograd graph. Tensor.numpy() rejects both,
    # so detach and move to host memory first (no-ops for a plain CPU tensor).
    samples = wav.squeeze(0).detach().cpu().numpy()
    # NOTE(review): 24000 is presumably the model's output sample rate in Hz;
    # confirm against OratorTTS.
    return 24000, samples

# Input widgets, listed in the same order as the parameters of `generate`:
# text, audio_prompt_path, emotion_adv.
_inputs = [
    gr.Textbox(label="Text to synthesize", value="What does the fox say?"),
    gr.Audio(label="Input Audio File", sources="upload", type="filepath"),
    gr.Slider(minimum=0, maximum=1, value=0.5, step=0.05, label="emotion_adv"),
]

# Wire `generate` to the inputs above and a single audio output.
demo = gr.Interface(fn=generate, inputs=_inputs, outputs="audio")

# Only start the web UI when this file is executed as a script.
if __name__ == "__main__":
    demo.launch()