Spaces:

Sayiqa7
/

youtbe_content_summ

Running

App Files Community

Sayiqa7 committed on Dec 29, 2024

Commit

f60d1cb

verified ·

1 Parent(s): 196d2a2

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -49

app.py CHANGED Viewed

@@ -144,52 +144,35 @@ else:
 ##########################
-def get_video_info(url, max_retries=3):
-    """Get video title and transcript with retries"""
-    video_id = extract_video_id(url)
-    if not video_id:
-        return None, "Invalid YouTube URL"
-    # Try multiple times to get video info
-    for attempt in range(max_retries):
-        try:
-            # Initialize YouTube object with additional parameters
-            yt = YouTube(
-                url,
-                use_oauth=False,
-                allow_oauth_cache=True
-            )
-            # Add a small delay
-            time.sleep(1)
-            # Try to get title, with fallback
-            try:
-                title = yt.title
-            except:
-                title = f"Video {video_id}"
-            # Try to get transcript (including auto-generated captions)
-            transcript = None
-            try:
-                transcript_list = YouTubeTranscriptApi.get_transcript(video_id)
-                transcript = ' '.join([t['text'] for t in transcript_list])
-            except:
-                try:
-                    # Try getting auto-generated transcript
-                    transcript_list = YouTubeTranscriptApi.get_transcript(video_id, languages=['en-US', 'en'])
-                    transcript = ' '.join([t['text'] for t in transcript_list])
-                except Exception as e:
-                    print(f"Transcript error: {str(e)}")
-                    # If both fail, return error message
-                    return None, "No transcript available for this video. Please try a video with captions enabled."
-            return title, transcript
-        except Exception as e:
-            if attempt == max_retries - 1:
-                return None, f"Failed to fetch video information after {max_retries} attempts. Error: {str(e)}"
-            time.sleep(1)  # Wait before retrying
-# Launch the interface
-if __name__ == "__main__":
-    interface.launch()

 ##########################
+from pytube import YouTube
+# Replace with your YouTube video URL
+video_url = "https://www.youtube.com/watch?v=YOUR_VIDEO_ID"
+# Download audio
+yt = YouTube(video_url)
+stream = yt.streams.filter(only_audio=True).first()
+stream.download(filename="audio.mp4")
+from transformers import pipeline
+# Load the speech-to-text pipeline
+transcriber = pipeline(model="openai/whisper-large", task="automatic-speech-recognition")
+# Transcribe the audio file
+result = transcriber("audio.mp4")
+print(result['text'])
+import gradio as gr
+# Define a function for Gradio interface
+def transcribe_audio(audio):
+    result = transcriber(audio.name)
+    return result['text']
+# Create a Gradio interface
+interface = gr.Interface(fn=transcribe_audio, inputs=gr.Audio(), outputs="text")
+# Launch the Gradio interface
+interface.launch()