Spaces:

tufailnewuse
/

speech_to_text

Running

tufailnewuse commited on Nov 9, 2024

Commit

bbafd1c

verified ·

1 Parent(s): 373aa9e

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+import streamlit as st
+from transformers import pipeline
+import soundfile as sf
+import tempfile
+# Load the ASR model from Hugging Face
+@st.cache_resource
+def load_model():
+    # Use Hugging Face's pipeline with your desired model
+    return pipeline("automatic-speech-recognition", model="fractalego/personal-speech-to-text-model")
+# Initialize the model pipeline
+pipe = load_model()
+# Streamlit UI
+st.title("Speech-to-Text Transcription App")
+st.write("Upload an audio file, and the AI model will transcribe it.")
+# Upload audio file
+uploaded_file = st.file_uploader("Choose an audio file", type=["wav", "mp3", "m4a"])
+if uploaded_file is not None:
+    st.audio(uploaded_file, format='audio/wav')
+    # Save uploaded file to a temporary location
+    with tempfile.NamedTemporaryFile(delete=False) as temp_file:
+        temp_file.write(uploaded_file.read())
+        temp_file_path = temp_file.name
+    # Read the audio file and transcribe
+    with st.spinner("Transcribing... Please wait..."):
+        transcription = pipe(temp_file_path)
+    # Display the transcription result
+    st.subheader("Transcription")
+    st.write(transcription['text'])
+else:
+    st.info("Please upload an audio file to start transcription.")