pratikshahp committed on
Commit
e63c494
·
verified ·
1 Parent(s): 6daa843

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -8
app.py CHANGED
@@ -2,7 +2,6 @@ import torch
2
  import torchaudio
3
  from torchaudio.transforms import Resample
4
  from transformers import Speech2TextProcessor, Speech2TextForConditionalGeneration
5
- from audio_recorder_streamlit import audio_recorder
6
  import streamlit as st
7
 
8
  def preprocess_audio(audio_bytes, sample_rate=16000):
@@ -26,7 +25,7 @@ def transcribe_audio(audio_bytes):
26
  input_features = preprocess_audio(audio_bytes)
27
 
28
  # Tokenize audio
29
- inputs = processor(input_features, return_tensors="pt", padding=True)
30
 
31
  # Generate transcription
32
  generated_ids = model.generate(inputs.input_features)
@@ -34,16 +33,21 @@ def transcribe_audio(audio_bytes):
34
 
35
  return translation
36
 
37
- st.title("Audio to Text Transcription..")
38
- audio_bytes = audio_recorder(pause_threshold=3.0, sample_rate=16000)
39
- if audio_bytes:
40
- st.audio(audio_bytes, format="audio/wav")
41
 
 
 
 
 
 
 
42
  transcription = transcribe_audio(audio_bytes)
 
43
  if transcription:
44
  st.write("Transcription:")
45
- st.write(transcription)
46
  else:
47
  st.write("Error: Failed to transcribe audio.")
48
  else:
49
- st.write("No audio recorded.")
 
 
2
  import torchaudio
3
  from torchaudio.transforms import Resample
4
  from transformers import Speech2TextProcessor, Speech2TextForConditionalGeneration
 
5
  import streamlit as st
6
 
7
  def preprocess_audio(audio_bytes, sample_rate=16000):
 
25
  input_features = preprocess_audio(audio_bytes)
26
 
27
  # Tokenize audio
28
+ inputs = processor(input_features.squeeze(0), return_tensors="pt", padding=True)
29
 
30
  # Generate transcription
31
  generated_ids = model.generate(inputs.input_features)
 
33
 
34
  return translation
35
 
36
+ st.title("Audio to Text Transcription")
 
 
 
37
 
38
+ uploaded_file = st.file_uploader("Upload audio file", type=["wav"])
39
+
40
+ if uploaded_file is not None:
41
+ st.audio(uploaded_file, format="audio/wav")
42
+
43
+ audio_bytes = uploaded_file.getvalue()
44
  transcription = transcribe_audio(audio_bytes)
45
+
46
  if transcription:
47
  st.write("Transcription:")
48
+ st.write(transcription[0])
49
  else:
50
  st.write("Error: Failed to transcribe audio.")
51
  else:
52
+ st.write("Please upload an audio file.")
53
+