someshb07 committed on
Commit
945679c
·
verified ·
1 Parent(s): e8f1cde

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -4
app.py CHANGED
@@ -3,9 +3,14 @@ from youtube_transcript_api import YouTubeTranscriptApi
3
  from youtube_transcript_api.formatters import TextFormatter
4
  from transformers import pipeline
5
  import re
6
- import gradio
7
 
8
- pipe = pipeline("summarization", model="Falconsai/text_summarization")
 
 
 
 
 
9
 
10
  def extract_youtube_id(url):
11
  """
@@ -26,8 +31,12 @@ def extract_youtube_id(url):
26
  return None
27
 
28
  def summary(text_transcript):
29
- output = pipe(text_transcript)
30
- return output[0]['summary_text']
 
 
 
 
31
 
32
  def get_youtube_transcript(link):
33
  video_id= extract_youtube_id(link)
 
3
  from youtube_transcript_api.formatters import TextFormatter
4
  from transformers import pipeline
5
  import re
6
+ import gradio as gr
7
 
8
+ pipe = pipeline("summarization", model="Falconsai/text_summarization", device=-1)
9
+
10
def chunk_length(text, max_length=1024):
    """Yield consecutive pieces of *text* holding at most *max_length* words.

    The text is split on whitespace, so every yielded chunk is re-joined with
    single spaces. Empty or whitespace-only text yields nothing.

    Args:
        text: The string to split into chunks.
        max_length: Maximum number of whitespace-separated words per chunk.

    Yields:
        Each chunk as one space-joined string, in original word order.

    Raises:
        ValueError: If *max_length* is less than 1 (raised on first iteration,
            because this is a generator).
    """
    if max_length < 1:
        # A zero step makes range() raise and a negative step silently yields
        # nothing; fail loudly with a clear message in both cases.
        raise ValueError("max_length must be a positive integer")
    words = text.split()
    for start in range(0, len(words), max_length):
        yield " ".join(words[start:start + max_length])
14
 
15
  def extract_youtube_id(url):
16
  """
 
31
  return None
32
 
33
  def summary(text_transcript):
34
+ try:
35
+ chunks = chunk_text(text_transcript)
36
+ summarized_chunks = [pipe(chunk)[0]['summary_text'] for chunk in chunks]
37
+ return " ".join(summarized_chunks)
38
+ except Exception as e:
39
+ return f"Error during summarization: {e}"
40
 
41
  def get_youtube_transcript(link):
42
  video_id= extract_youtube_id(link)