Spaces:

EnzoBustos
/

TuringVideos

Sleeping

EnzoBustos committed on Dec 8, 2023

Commit

7732184

1 Parent(s): 3650db9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,10 +18,12 @@ st.set_page_config(
 )
 #@st.cache_resource
-#@st.cache_data
 def download_audio(link):
-    with yt_dlp.YoutubeDL({'extract_audio': True, 'format': 'bestaudio', 'outtmpl': 'video.mp3'}) as video:
-        video.download(link)
 #Load Whisper pipeline via HuggingFace
 @st.cache_resource
@@ -54,7 +56,7 @@ def load_nltk():
 #Make the ASR task
 @st.cache_data
-def audio_speech_recognition(_model_pipeline, video="video.mp3"):
     return _model_pipeline(video, batch_size=64)["text"].strip()
 #Make the Summarization task
@@ -120,7 +122,7 @@ def main():
             with st.spinner("Carregando modelos..."):
                 if language == "Inglês (en)":
-                    download_audio(link)
                     load_nltk()
                     whisper = load_whisper()
                     extractive = load_extractive()
@@ -133,7 +135,7 @@ def main():
                     st.header("Erro na seleção de linguagem.")
             with st.spinner("Transcrevendo texto..."):
-                transcript_text = audio_speech_recognition(whisper)
             with model_1:
                 st.header("Texto Sumarizado:")

 )
 #@st.cache_resource
 def download_audio(link):
+    """Download the audio for `link` and return the video's id.
+
+    The file is written to the current working directory using the
+    '%(id)s.mp3' output template, i.e. as "<id>.mp3".
+
+    Args:
+        link: URL of the video to fetch.
+
+    Returns:
+        The 'id' field of the info dict reported by yt_dlp for `link`.
+    """
+    # NOTE(review): 'extract_audio' mirrors the CLI flag name; confirm that
+    # YoutubeDL honours it as an option key (audio conversion is normally
+    # configured through 'postprocessors').
+    options = {'extract_audio': True, 'format': 'bestaudio', 'outtmpl': '%(id)s.mp3'}
+    with yt_dlp.YoutubeDL(options) as downloader:
+        # extract_info(download=True) already fetches the file, so a separate
+        # downloader.download(link) call afterwards is redundant.
+        info_dict = downloader.extract_info(link, download=True)
+    return info_dict['id']
 #Load Whisper pipeline via HuggingFace
 @st.cache_resource
 #Make the ASR task
 @st.cache_data
+def audio_speech_recognition(_model_pipeline, video_id):
+    """Transcribe the downloaded audio of `video_id` and return its text.
+
+    Args:
+        _model_pipeline: Callable ASR pipeline; it is called with the audio
+            path and `batch_size=64` and must return a mapping with a
+            "text" entry. The leading underscore keeps Streamlit's cache
+            from trying to hash it.
+        video_id: Id returned by `download_audio`; the audio is expected at
+            "<video_id>.mp3" in the current working directory.
+
+    Returns:
+        The transcription with surrounding whitespace stripped.
+    """
+    # The parameter was renamed to `video_id`, so the old `video` name no
+    # longer exists here; build the path from the '%(id)s.mp3' template
+    # that download_audio writes to.
+    audio_path = f"{video_id}.mp3"
+    return _model_pipeline(audio_path, batch_size=64)["text"].strip()
 #Make the Summarization task
             with st.spinner("Carregando modelos..."):
                 if language == "Inglês (en)":
+                    id = download_audio(link)
                     load_nltk()
                     whisper = load_whisper()
                     extractive = load_extractive()
                     st.header("Erro na seleção de linguagem.")
             with st.spinner("Transcrevendo texto..."):
+                transcript_text = audio_speech_recognition(whisper, id)
             with model_1:
                 st.header("Texto Sumarizado:")