EnzoBustos committed on
Commit
7732184
·
1 Parent(s): 3650db9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -6
app.py CHANGED
@@ -18,10 +18,12 @@ st.set_page_config(
18
  )
19
 
20
  #@st.cache_resource
21
- #@st.cache_data
22
  def download_audio(link):
23
- with yt_dlp.YoutubeDL({'extract_audio': True, 'format': 'bestaudio', 'outtmpl': 'video.mp3'}) as video:
24
- video.download(link)
 
 
 
25
 
26
  #Load Whisper pipeline via HuggingFace
27
  @st.cache_resource
@@ -54,7 +56,7 @@ def load_nltk():
54
 
55
  #Make the ASR task
56
  @st.cache_data
57
- def audio_speech_recognition(_model_pipeline, video="video.mp3"):
58
  return _model_pipeline(video, batch_size=64)["text"].strip()
59
 
60
  #Make the Summarization task
@@ -120,7 +122,7 @@ def main():
120
  with st.spinner("Carregando modelos..."):
121
 
122
  if language == "Inglês (en)":
123
- download_audio(link)
124
  load_nltk()
125
  whisper = load_whisper()
126
  extractive = load_extractive()
@@ -133,7 +135,7 @@ def main():
133
  st.header("Erro na seleção de linguagem.")
134
 
135
  with st.spinner("Transcrevendo texto..."):
136
- transcript_text = audio_speech_recognition(whisper)
137
 
138
  with model_1:
139
  st.header("Texto Sumarizado:")
 
18
  )
19
 
20
  #@st.cache_resource
 
21
  def download_audio(link):
22
+ with yt_dlp.YoutubeDL({'extract_audio': True, 'format': 'bestaudio', 'outtmpl': '%(id)s.mp3'}) as video:
23
+ info_dict = video.extract_info(link, download = True)
24
+ id = info_dict['id']
25
+ video.download(link)
26
+ return id
27
 
28
  #Load Whisper pipeline via HuggingFace
29
  @st.cache_resource
 
56
 
57
  #Make the ASR task
58
  @st.cache_data
59
+ def audio_speech_recognition(_model_pipeline, video_id):
60
  return _model_pipeline(video, batch_size=64)["text"].strip()
61
 
62
  #Make the Summarization task
 
122
  with st.spinner("Carregando modelos..."):
123
 
124
  if language == "Inglês (en)":
125
+ id = download_audio(link)
126
  load_nltk()
127
  whisper = load_whisper()
128
  extractive = load_extractive()
 
135
  st.header("Erro na seleção de linguagem.")
136
 
137
  with st.spinner("Transcrevendo texto..."):
138
+ transcript_text = audio_speech_recognition(whisper, id)
139
 
140
  with model_1:
141
  st.header("Texto Sumarizado:")