someshb07 committed on
Commit
d4317f5
·
verified ·
1 Parent(s): f37e37c

Create Youtube_summarizer.py

Browse files
Files changed (1) hide show
  1. Youtube_summarizer.py +32 -0
Youtube_summarizer.py ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ from youtube_transcript_api import YouTubeTranscriptApi
3
+ from youtube_transcript_api.formatters import TextFormatter
4
+ from transformers import pipeline
5
+ import re
6
+ import gradio
7
+
8
# Summarization pipeline, built once when the module is imported and reused
# by every call to summary().
pipe = pipeline(task="summarization", model="Falconsai/text_summarization")
9
+
10
def summary(text_transcript, *, max_chunk_words=300):
    """Summarize a transcript with the module-level ``pipe`` pipeline.

    Long transcripts are split into word-bounded chunks that are summarized
    one by one, so the whole text contributes to the result instead of being
    pushed through the model in a single oversized call.

    Args:
        text_transcript: Plain-text transcript to summarize.
        max_chunk_words: Maximum number of whitespace-separated words sent to
            the model per call. Must be at least 1.

    Returns:
        The summary text. Chunk summaries are joined with single spaces.
        An empty string is returned for empty or whitespace-only input.

    Raises:
        ValueError: If ``max_chunk_words`` is smaller than 1.
    """
    if max_chunk_words < 1:
        raise ValueError("max_chunk_words must be at least 1")

    # Nothing to summarize: skip the model call entirely.
    if not text_transcript or not text_transcript.strip():
        return ""

    words = text_transcript.split()
    if len(words) <= max_chunk_words:
        # Short input is passed through untouched, exactly as before.
        chunks = [text_transcript]
    else:
        chunks = [
            " ".join(words[start:start + max_chunk_words])
            for start in range(0, len(words), max_chunk_words)
        ]

    # truncation=True is a safety net for chunks that still tokenize to more
    # tokens than the model accepts (e.g. very long "words").
    partial_summaries = [
        pipe(chunk, truncation=True)[0]["summary_text"] for chunk in chunks
    ]
    return " ".join(partial_summaries)
13
+
14
# Matches the 11-character video ID in the common YouTube URL layouts
# (watch?v=, youtu.be/, embed/, shorts/, live/, v/).
_YOUTUBE_ID_PATTERN = re.compile(
    r"(?:youtu\.be/"
    r"|youtube(?:-nocookie)?\.com/(?:watch\?(?:.*&)?v=|embed/|shorts/|live/|v/))"
    r"([A-Za-z0-9_-]{11})(?![A-Za-z0-9_-])"
)


def extract_youtube_id(link):
    """Return the 11-character video ID contained in *link*, or ``None``.

    Accepts either a bare video ID or a YouTube URL. Anything else,
    including non-string input, yields ``None``.
    """
    if not isinstance(link, str):
        return None

    candidate = link.strip()
    # A bare ID (no URL around it) is accepted as-is.
    if re.fullmatch(r"[A-Za-z0-9_-]{11}", candidate):
        return candidate

    match = _YOUTUBE_ID_PATTERN.search(candidate)
    return match.group(1) if match else None


def get_youtube_transcript(link):
    """Fetch the transcript of a YouTube video and return its summary.

    Args:
        link: YouTube URL (or bare video ID) of the video to summarize.

    Returns:
        The summarized transcript. If no video ID can be extracted, or if
        fetching, formatting, or summarizing fails, a human-readable error
        message is returned instead of raising.
    """
    video_id = extract_youtube_id(link)
    if not video_id:
        return "Video ID could not be extracted"

    try:
        # Fetch the transcript. Newer youtube-transcript-api releases expose
        # the instance method fetch(); older ones only have the static
        # get_transcript(), so support both.
        if hasattr(YouTubeTranscriptApi, "fetch"):
            transcript = YouTubeTranscriptApi().fetch(video_id)
        else:
            transcript = YouTubeTranscriptApi.get_transcript(video_id)

        # Flatten the transcript entries into plain text.
        text_transcript = TextFormatter().format_transcript(transcript)

        return summary(text_transcript)
    except Exception as e:
        # UI boundary: report the failure as text rather than crashing.
        return f"An error has occured: {e}"
30
+
31
+
32
+