|
import streamlit as st

from transformers import pipeline

# Hugging Face Hub identifier of the checkpoint used for speech synthesis.
# NOTE(review): this is an ESPnet checkpoint; confirm that it can actually be
# loaded through `transformers.pipeline`, otherwise swap in a
# Transformers-native text-to-speech checkpoint.
TTS_MODEL_ID = "espnet/kan-bayashi_ljspeech_vits"


@st.cache_resource
def load_tts_model():
    """Build the text-to-speech pipeline once and share it across reruns.

    Streamlit re-executes this script from top to bottom on every widget
    interaction. Without caching, the pipeline would be rebuilt on each
    button click.

    Returns:
        The pipeline object created by
        ``pipeline("text-to-speech", model=TTS_MODEL_ID)``.
    """
    return pipeline("text-to-speech", model=TTS_MODEL_ID)


tts_model = load_tts_model()

st.title("Text-to-Audio App")
st.text("This app generates audio from text input using Hugging Face models.")

text_input = st.text_area("Enter some text for the model:")

if st.button("Generate Audio"):
    if not text_input.strip():
        # Whitespace-only input is treated the same as empty input.
        st.error("Please enter some text!")
    else:
        st.text("Generating audio response...")
        tts_audio = tts_model(text_input)

        # The text-to-speech pipeline returns a dict holding the waveform
        # under "audio" and its rate under "sampling_rate" (there is no "wav"
        # key). Passing both straight to st.audio lets Streamlit do the WAV
        # encoding and avoids a fixed on-disk file that concurrent sessions
        # would overwrite.
        st.audio(tts_audio["audio"], sample_rate=tts_audio["sampling_rate"])
        st.success("Audio generated successfully!")
|
|
|
|