shukdevdatta123 commited on
Commit
3e2d79c
·
verified ·
1 Parent(s): 8974aa3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +111 -52
app.py CHANGED
@@ -51,60 +51,119 @@ def transcribe_audio(audio_file):
51
  return "Could not request results from Google Speech Recognition service."
52
 
53
  # Streamlit app layout
54
- st.title("Video to Audio to Text Transcription")
55
- st.write("Upload a video file, and it will be converted to audio and transcribed into text.")
56
-
57
- # File uploader for video
58
- uploaded_video = st.file_uploader("Upload Video", type=["mp4", "mov", "avi"])
59
-
60
- if uploaded_video is not None:
61
- # Save the uploaded video file temporarily
62
- with tempfile.NamedTemporaryFile(delete=False) as tmp_video:
63
- tmp_video.write(uploaded_video.read())
64
- tmp_video_path = tmp_video.name
65
-
66
- # Add an "Analyze Video" button
67
- if st.button("Analyze Video"):
68
- with st.spinner("Processing video... Please wait."):
69
- # Convert video to audio
70
- audio_file = video_to_audio(tmp_video_path)
71
-
72
- # Convert the extracted MP3 audio to WAV
73
- wav_audio_file = convert_mp3_to_wav(audio_file)
74
-
75
- # Transcribe audio to text
76
- transcription = transcribe_audio(wav_audio_file)
77
 
78
- # Show the transcription
79
- st.text_area("Transcription", transcription, height=300)
80
 
81
- # Store transcription and audio file in session state
82
- st.session_state.transcription = transcription
83
- st.session_state.wav_audio_file = wav_audio_file
84
 
85
- # Cleanup temporary files
86
- os.remove(tmp_video_path)
87
- os.remove(audio_file)
 
 
88
 
89
- # Check if transcription and audio file are stored in session state
90
- if 'transcription' in st.session_state and 'wav_audio_file' in st.session_state:
91
- # Provide the audio file to the user for download
92
- st.audio(st.session_state.wav_audio_file, format='audio/wav')
93
-
94
- # Add download buttons for the transcription and audio
95
- # Downloadable transcription file
96
- st.download_button(
97
- label="Download Transcription",
98
- data=st.session_state.transcription,
99
- file_name="transcription.txt",
100
- mime="text/plain"
101
- )
102
-
103
- # Downloadable audio file
104
- with open(st.session_state.wav_audio_file, "rb") as audio_file_data:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
105
  st.download_button(
106
- label="Download Audio",
107
- data=audio_file_data,
108
- file_name="converted_audio.wav",
109
- mime="audio/wav"
110
- )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  return "Could not request results from Google Speech Recognition service."
52
 
53
  # Streamlit app layout
54
+ st.title("Video and Audio to Text Transcription")
55
+ st.write("Upload a video or audio file to convert it to transcription.")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
 
57
+ # Create tabs to separate video and audio uploads
58
+ tab = st.selectbox("Select the type of file to upload", ["Video", "Audio"])
59
 
60
+ if tab == "Video":
61
+ # File uploader for video
62
+ uploaded_video = st.file_uploader("Upload Video", type=["mp4", "mov", "avi"])
63
 
64
+ if uploaded_video is not None:
65
+ # Save the uploaded video file temporarily
66
+ with tempfile.NamedTemporaryFile(delete=False) as tmp_video:
67
+ tmp_video.write(uploaded_video.read())
68
+ tmp_video_path = tmp_video.name
69
 
70
+ # Add an "Analyze Video" button
71
+ if st.button("Analyze Video"):
72
+ with st.spinner("Processing video... Please wait."):
73
+ # Convert video to audio
74
+ audio_file = video_to_audio(tmp_video_path)
75
+
76
+ # Convert the extracted MP3 audio to WAV
77
+ wav_audio_file = convert_mp3_to_wav(audio_file)
78
+
79
+ # Transcribe audio to text
80
+ transcription = transcribe_audio(wav_audio_file)
81
+
82
+ # Show the transcription
83
+ st.text_area("Transcription", transcription, height=300)
84
+
85
+ # Store transcription and audio file in session state
86
+ st.session_state.transcription = transcription
87
+ st.session_state.wav_audio_file = wav_audio_file
88
+
89
+ # Cleanup temporary files
90
+ os.remove(tmp_video_path)
91
+ os.remove(audio_file)
92
+
93
+ # Check if transcription and audio file are stored in session state
94
+ if 'transcription' in st.session_state and 'wav_audio_file' in st.session_state:
95
+ # Provide the audio file to the user for download
96
+ st.audio(st.session_state.wav_audio_file, format='audio/wav')
97
+
98
+ # Add download buttons for the transcription and audio
99
+ # Downloadable transcription file
100
  st.download_button(
101
+ label="Download Transcription",
102
+ data=st.session_state.transcription,
103
+ file_name="transcription.txt",
104
+ mime="text/plain"
105
+ )
106
+
107
+ # Downloadable audio file
108
+ with open(st.session_state.wav_audio_file, "rb") as audio_file_data:
109
+ st.download_button(
110
+ label="Download Audio",
111
+ data=audio_file_data,
112
+ file_name="converted_audio.wav",
113
+ mime="audio/wav"
114
+ )
115
+
116
+ elif tab == "Audio":
117
+ # File uploader for audio
118
+ uploaded_audio = st.file_uploader("Upload Audio", type=["wav", "mp3"])
119
+
120
+ if uploaded_audio is not None:
121
+ # Save the uploaded audio file temporarily
122
+ with tempfile.NamedTemporaryFile(delete=False) as tmp_audio:
123
+ tmp_audio.write(uploaded_audio.read())
124
+ tmp_audio_path = tmp_audio.name
125
+
126
+ # Add an "Analyze Audio" button
127
+ if st.button("Analyze Audio"):
128
+ with st.spinner("Processing audio... Please wait."):
129
+ # Convert audio to WAV if it's in MP3 format
130
+ if uploaded_audio.type == "audio/mpeg":
131
+ wav_audio_file = convert_mp3_to_wav(tmp_audio_path)
132
+ else:
133
+ wav_audio_file = tmp_audio_path
134
+
135
+ # Transcribe audio to text
136
+ transcription = transcribe_audio(wav_audio_file)
137
+
138
+ # Show the transcription
139
+ st.text_area("Transcription", transcription, height=300)
140
+
141
+ # Store transcription in session state
142
+ st.session_state.transcription_audio = transcription
143
+ st.session_state.wav_audio_file_audio = wav_audio_file
144
+
145
+ # Cleanup temporary audio file
146
+ os.remove(tmp_audio_path)
147
+
148
+ # Check if transcription and audio file are stored in session state
149
+ if 'transcription_audio' in st.session_state and 'wav_audio_file_audio' in st.session_state:
150
+ # Provide the audio file to the user for download
151
+ st.audio(st.session_state.wav_audio_file_audio, format='audio/wav')
152
+
153
+ # Add download buttons for the transcription and audio
154
+ # Downloadable transcription file
155
+ st.download_button(
156
+ label="Download Transcription",
157
+ data=st.session_state.transcription_audio,
158
+ file_name="transcription_audio.txt",
159
+ mime="text/plain"
160
+ )
161
+
162
+ # Downloadable audio file
163
+ with open(st.session_state.wav_audio_file_audio, "rb") as audio_file_data:
164
+ st.download_button(
165
+ label="Download Audio",
166
+ data=audio_file_data,
167
+ file_name="converted_audio_audio.wav",
168
+ mime="audio/wav"
169
+ )