Deploying pipeline
Files added:
- app.py (+81 lines)
- multilingual_sentiment_model.py (+163 lines)
- requirements.txt (+6 lines)
app.py
ADDED
import gradio as gr
import pandas as pd
import logging
from multilingual_sentiment_model import (
    extract_video_id,
    get_video_title,
    get_comments,
    analyze_sentiment,
    plot_pie_chart,
    get_overall_sentiment,
)

# === Setup Logging ===
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s - %(levelname)s - %(message)s",
)

# Gradio handler with logging
def youtube_sentiment_analysis(url, num_of_comments):
    try:
        video_id = extract_video_id(url)
        if not video_id:
            logging.warning("Invalid YouTube URL entered in UI.")
            return "Error: Invalid YouTube URL", None, None

        video_title = get_video_title(video_id)  # Fetch the video title

        comments, error = get_comments(video_id, int(num_of_comments))
        if error:
            logging.error(f"Error fetching comments: {error}")
            return f"Error fetching comments: {error}", None, None

        if not comments:
            logging.warning("No comments found for the video.")
            return "Error: No comments found.", None, None

        sentiment_results, sentiment_counts = analyze_sentiment(comments)
        chart = plot_pie_chart(sentiment_counts, video_title)  # Pass the title to the chart
        summary = get_overall_sentiment(sentiment_counts)

        return summary, chart, pd.DataFrame(sentiment_results).head(5)

    except Exception as e:
        logging.exception(f"Unexpected Error: {e}")
        return f"Unexpected Error: {e}", None, None

# Gradio interface (all outputs below the input)
iface = gr.Blocks()

# Example YouTube URLs
example_urls = [
    "https://www.youtube.com/watch?v=0e9WuB0Ua98",
    "https://www.youtube.com/watch?v=3JZ_D3ELwOQ",
    "https://youtu.be/dQw4w9WgXcQ",
    "https://www.youtube.com/watch?v=9bZkp7q19f0",
    "https://www.youtube.com/watch?v=2Vv-BfVoq4g",
]

with iface:
    gr.Markdown("## YouTube Comment Sentiment Analysis", elem_classes="centered-title")
    gr.Markdown("Enter a YouTube video URL and specify the number of comments to analyze.")

    with gr.Row():
        youtube_url = gr.Textbox(label="YouTube Video URL")
        num_comments = gr.Slider(minimum=10, maximum=1000, step=1, value=100,
                                 label="Number of Comments to Fetch")

    submit_btn = gr.Button("Submit")

    # All outputs are placed BELOW the input
    output_summary = gr.Textbox(label="Overall Sentiment Summary")
    output_chart = gr.Plot(label="Sentiment Chart")
    output_table = gr.Dataframe(label="Comment Sentiment Analysis")

    submit_btn.click(
        youtube_sentiment_analysis,
        inputs=[youtube_url, num_comments],
        outputs=[output_summary, output_chart, output_table],
    )

    gr.Markdown("### Example YouTube Video URLs for Testing (Click to Use)")
    with gr.Row():
        for example in example_urls:
            # Default argument binds the current URL so each button fills the textbox
            gr.Button(example).click(fn=lambda x=example: x, outputs=[youtube_url])

# Launch App
iface.launch(share=True)
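As a quick sanity check outside the UI, the same helpers the button handler calls can be exercised directly. A minimal sketch (a hypothetical script, not part of this commit; assumes the YOUTUBE_API_KEY environment variable used by the module below is set):

# smoke_test.py — hypothetical local check
from multilingual_sentiment_model import (
    extract_video_id, get_comments, analyze_sentiment, get_overall_sentiment
)

video_id = extract_video_id("https://youtu.be/dQw4w9WgXcQ")  # -> "dQw4w9WgXcQ"

comments, error = get_comments(video_id, max_results=20)
if error:
    raise SystemExit(error)

results, counts = analyze_sentiment(comments)
print(counts)                          # e.g. {'positive': 12, 'neutral': 5, 'negative': 3}
print(get_overall_sentiment(counts))   # e.g. "Overall Video Sentiment: POSITIVE"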
multilingual_sentiment_model.py
ADDED
import re
import os
import matplotlib.pyplot as plt
import logging
from googleapiclient.discovery import build
from transformers import pipeline
import textwrap

# === Setup Logging ===
logging.basicConfig(
    filename="app_logs.log",  # Log file name
    level=logging.INFO,       # Log info, warnings, and errors
    format="%(asctime)s - %(levelname)s - %(message)s",
)

# YouTube Data API key, read from the environment rather than hardcoded
# (YOUTUBE_API_KEY is the variable name chosen here)
API_KEY = os.getenv("YOUTUBE_API_KEY")

# Load Hugging Face Sentiment Model
try:
    sentiment_classifier = pipeline(
        model="lxyuan/distilbert-base-multilingual-cased-sentiments-student",
        top_k=None
    )
    logging.info("Sentiment analysis model loaded successfully.")
except Exception as e:
    logging.error(f"Failed to load sentiment model: {e}")
    raise RuntimeError("Error loading sentiment model. Check logs for details.")

# Extract Video ID from URL
def extract_video_id(url):
    """
    Extracts the YouTube video ID from the common YouTube URL formats.
    """
    try:
        patterns = [
            r"(?:https?:\/\/)?(?:www\.)?youtube\.com\/watch\?v=([^&]+)",
            r"(?:https?:\/\/)?(?:www\.)?youtube\.com\/embed\/([^?]+)",
            r"(?:https?:\/\/)?(?:www\.)?youtube\.com\/v\/([^?]+)",
            r"(?:https?:\/\/)?youtu\.be\/([^?]+)",
        ]

        for pattern in patterns:
            match = re.search(pattern, url)
            if match:
                return match.group(1)

        return None  # No format matched
    except Exception:
        return None

# Fetch YouTube Comments with Pagination
def get_comments(video_id, max_results=500):
    youtube = build("youtube", "v3", developerKey=API_KEY)
    comments = []
    next_page_token = None

    try:
        while len(comments) < max_results:
            request = youtube.commentThreads().list(
                part="snippet",
                videoId=video_id,
                maxResults=min(100, max_results - len(comments)),  # API allows up to 100 per request
                textFormat="plainText",
                pageToken=next_page_token,
            )
            response = request.execute()

            for item in response.get("items", []):
                comment = item["snippet"]["topLevelComment"]["snippet"]["textDisplay"]
                comments.append(comment)

            next_page_token = response.get("nextPageToken")
            if not next_page_token:
                break

        logging.info(f"Fetched {len(comments)} comments for Video ID: {video_id}")
    except Exception as e:
        logging.error(f"Error fetching comments: {e}")
        return [], f"Error fetching comments: {e}"

    return comments[:max_results], None


def get_video_title(video_id):
    """
    Fetches the title of the YouTube video using the YouTube Data API.
    """
    youtube = build("youtube", "v3", developerKey=API_KEY)

    try:
        request = youtube.videos().list(part="snippet", id=video_id)
        response = request.execute()

        if response.get("items"):
            return response["items"][0]["snippet"]["title"]
        return "Unknown Video Title"
    except Exception as e:
        logging.error(f"Error fetching video title: {e}")
        return "Error Fetching Title"

# Sentiment Analysis
def analyze_sentiment(comments):
    results = []
    sentiment_counts = {"positive": 0, "neutral": 0, "negative": 0}

    try:
        for comment in comments:
            sentiment_scores = sentiment_classifier(comment)[0]
            sentiment = max(sentiment_scores, key=lambda x: x["score"])
            sentiment_label = sentiment["label"]
            sentiment_counts[sentiment_label] += 1
            results.append({
                "Comment": comment,
                "Sentiment": sentiment_label,
                "Score": sentiment["score"],
            })

        logging.info("Sentiment analysis completed successfully.")
    except Exception as e:
        # Log and fall through so callers always receive (results, counts),
        # never an error string in place of the counts dict
        logging.error(f"Error analyzing sentiment: {e}")

    return results, sentiment_counts

# Generate Pie Chart
def plot_pie_chart(sentiment_counts, video_title):
    """
    Generates a pie chart of the sentiment distribution with a wrapped video title.
    """
    try:
        fig, ax = plt.subplots(figsize=(8, 6))  # Larger figure for better visibility

        # Wrap the title if it is too long (every 50 characters)
        wrapped_title = "\n".join(textwrap.wrap(video_title, width=50))

        ax.pie(
            sentiment_counts.values(),
            labels=sentiment_counts.keys(),
            autopct="%1.1f%%",
            startangle=140,
        )
        ax.set_title(f"Sentiment Analysis for:\n{wrapped_title}", fontsize=10)

        logging.info(f"Pie chart generated successfully for {video_title}.")
        return fig
    except Exception as e:
        logging.error(f"Error generating pie chart: {e}")
        return None

# Overall Sentiment Summary
def get_overall_sentiment(sentiment_counts):
    try:
        overall_sentiment = f"Overall Video Sentiment: {max(sentiment_counts, key=sentiment_counts.get).upper()}"
        logging.info(overall_sentiment)
        return overall_sentiment
    except Exception as e:
        logging.error(f"Error calculating overall sentiment: {e}")
        return "Error calculating overall sentiment."
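For reference, with top_k=None the transformers text-classification pipeline returns, for each input, a list of every label with its score, which is the shape analyze_sentiment relies on when it takes the max. An illustrative sketch (the scores shown are made up):

from multilingual_sentiment_model import sentiment_classifier

scores = sentiment_classifier("This video is fantastic!")[0]
# scores looks roughly like (illustrative values):
# [{'label': 'positive', 'score': 0.96},
#  {'label': 'neutral',  'score': 0.03},
#  {'label': 'negative', 'score': 0.01}]
best = max(scores, key=lambda s: s["score"])
print(best["label"])  # 'positive'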
requirements.txt
ADDED
google-api-python-client
transformers
torch
pandas
matplotlib
gradio
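Since multilingual_sentiment_model reads the API key at import time, a local run has to set it before the app module is imported. A hypothetical launcher sketch (assumes the packages above are installed):

# run_local.py — hypothetical, not part of this commit
import os

# Placeholder value only; must be set before app (and therefore the model
# module) is imported, because API_KEY is read when the module loads.
os.environ.setdefault("YOUTUBE_API_KEY", "your-api-key-here")

import app  # importing app builds the Blocks UI and calls iface.launch()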