Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -2,7 +2,6 @@ import torch
|
|
2 |
import torchaudio
|
3 |
from torchaudio.transforms import Resample
|
4 |
from transformers import Speech2TextProcessor, Speech2TextForConditionalGeneration
|
5 |
-
from audio_recorder_streamlit import audio_recorder
|
6 |
import streamlit as st
|
7 |
|
8 |
def preprocess_audio(audio_bytes, sample_rate=16000):
|
@@ -26,7 +25,7 @@ def transcribe_audio(audio_bytes):
|
|
26 |
input_features = preprocess_audio(audio_bytes)
|
27 |
|
28 |
# Tokenize audio
|
29 |
-
inputs = processor(input_features, return_tensors="pt", padding=True)
|
30 |
|
31 |
# Generate transcription
|
32 |
generated_ids = model.generate(inputs.input_features)
|
@@ -34,16 +33,21 @@ def transcribe_audio(audio_bytes):
|
|
34 |
|
35 |
return translation
|
36 |
|
37 |
-
st.title("Audio to Text Transcription
|
38 |
-
audio_bytes = audio_recorder(pause_threshold=3.0, sample_rate=16000)
|
39 |
-
if audio_bytes:
|
40 |
-
st.audio(audio_bytes, format="audio/wav")
|
41 |
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
transcription = transcribe_audio(audio_bytes)
|
|
|
43 |
if transcription:
|
44 |
st.write("Transcription:")
|
45 |
-
st.write(transcription)
|
46 |
else:
|
47 |
st.write("Error: Failed to transcribe audio.")
|
48 |
else:
|
49 |
-
st.write("
|
|
|
|
2 |
import torchaudio
|
3 |
from torchaudio.transforms import Resample
|
4 |
from transformers import Speech2TextProcessor, Speech2TextForConditionalGeneration
|
|
|
5 |
import streamlit as st
|
6 |
|
7 |
def preprocess_audio(audio_bytes, sample_rate=16000):
|
|
|
25 |
input_features = preprocess_audio(audio_bytes)
|
26 |
|
27 |
# Tokenize audio
|
28 |
+
inputs = processor(input_features.squeeze(0), return_tensors="pt", padding=True)
|
29 |
|
30 |
# Generate transcription
|
31 |
generated_ids = model.generate(inputs.input_features)
|
|
|
33 |
|
34 |
return translation
|
35 |
|
36 |
+
st.title("Audio to Text Transcription")
|
|
|
|
|
|
|
37 |
|
38 |
+
uploaded_file = st.file_uploader("Upload audio file", type=["wav"])
|
39 |
+
|
40 |
+
if uploaded_file is not None:
|
41 |
+
st.audio(uploaded_file, format="audio/wav")
|
42 |
+
|
43 |
+
audio_bytes = uploaded_file.getvalue()
|
44 |
transcription = transcribe_audio(audio_bytes)
|
45 |
+
|
46 |
if transcription:
|
47 |
st.write("Transcription:")
|
48 |
+
st.write(transcription[0])
|
49 |
else:
|
50 |
st.write("Error: Failed to transcribe audio.")
|
51 |
else:
|
52 |
+
st.write("Please upload an audio file.")
|
53 |
+
|