Sigrid De los Santos committed · Commit 0d9c76e · 1 Parent(s): da7cc35

Add matplotlib to requirements

Files changed: src/main.py (+37, -59)
src/main.py CHANGED
@@ -3,9 +3,6 @@ import sys
 from datetime import datetime
 from dotenv import load_dotenv
 import pandas as pd
-from io import BytesIO
-import base64
-import matplotlib.pyplot as plt
 
 from md_html import convert_single_md_to_html as convert_md_to_html
 from news_analysis import fetch_deep_news, generate_value_investor_report
@@ -32,33 +29,16 @@ def build_metrics_box(topic, num_articles):
     >
     """
 
-def
-    # Placeholder dummy chart
-    dates = pd.date_range(end=datetime.today(), periods=7)
-    values = [100 + i * 3 for i in range(7)]
-
-    plt.figure(figsize=(6, 3))
-    plt.plot(dates, values, marker='o')
-    plt.title(f"π Sentiment Trend: {topic}")
-    plt.xlabel("Date")
-    plt.ylabel("Sentiment")
-    plt.grid(True)
-
-    buffer = BytesIO()
-    plt.savefig(buffer, format='png')
-    plt.close()
-    buffer.seek(0)
-    encoded = base64.b64encode(buffer.read()).decode("utf-8")
-    return f""
-
-def run_value_investing_analysis(csv_path):
+def run_value_investing_analysis(csv_path, progress_callback=None):
     current_df = pd.read_csv(csv_path)
     prev_path = os.path.join(BASE_DIR, "investing_topics_prev.csv")
+
     if os.path.exists(prev_path):
         previous_df = pd.read_csv(prev_path)
         changed_df = detect_changes(current_df, previous_df)
         if changed_df.empty:
-
+            if progress_callback:
+                progress_callback("β No changes detected. Skipping processing.")
             return []
         else:
             changed_df = current_df
@@ -68,18 +48,25 @@ def run_value_investing_analysis(csv_path):
     for _, row in changed_df.iterrows():
         topic = row.get("topic")
         timespan = row.get("timespan_days", 7)
-
+        msg = f"π Processing: {topic} ({timespan} days)"
+        print(msg)
+        if progress_callback:
+            progress_callback(msg)
 
         news = fetch_deep_news(topic, timespan)
         if not news:
-
+            warning = f"β οΈ No news found for: {topic}"
+            print(warning)
+            if progress_callback:
+                progress_callback(warning)
             continue
 
         report_body = generate_value_investor_report(topic, news)
-
+        image_url = "https://via.placeholder.com/1281x721?text=No+Image+Available"
+        image_credit = "Image placeholder"
 
         metrics_md = build_metrics_box(topic, len(news))
-        full_md = metrics_md + report_body
+        full_md = metrics_md + report_body
 
         base_filename = f"{topic.replace(' ', '_').lower()}_{datetime.now().strftime('%Y-%m-%d')}"
         filename = base_filename + ".md"
@@ -96,14 +83,15 @@ def run_value_investing_analysis(csv_path):
 
         new_md_files.append(filepath)
 
-
+    if progress_callback:
+        progress_callback(f"β Markdown saved to: {DATA_DIR}")
     current_df.to_csv(prev_path, index=False)
     return new_md_files
 
-def run_pipeline(csv_path, tavily_api_key):
+def run_pipeline(csv_path, tavily_api_key, progress_callback=None):
     os.environ["TAVILY_API_KEY"] = tavily_api_key
 
-    new_md_files = run_value_investing_analysis(csv_path)
+    new_md_files = run_value_investing_analysis(csv_path, progress_callback)
     new_html_paths = []
 
     for md_path in new_md_files:
@@ -119,18 +107,19 @@ if __name__ == "__main__":
         convert_md_to_html(md, HTML_DIR)
     print(f"π All reports converted to HTML at: {HTML_DIR}")
 
-
 # import os
 # import sys
 # from datetime import datetime
 # from dotenv import load_dotenv
-# import pandas as pd
 
 # from image_search import search_unsplash_image
 # from md_html import convert_single_md_to_html as convert_md_to_html
 # from news_analysis import fetch_deep_news, generate_value_investor_report
+
+# import pandas as pd
 # from csv_utils import detect_changes
 
+
 # # Setup paths
 # BASE_DIR = os.path.dirname(os.path.dirname(__file__))  # one level up from src/
 # DATA_DIR = os.path.join(BASE_DIR, "data")
@@ -152,16 +141,14 @@ if __name__ == "__main__":
 #     >
 #     """
 
-# def run_value_investing_analysis(csv_path
+# def run_value_investing_analysis(csv_path):
 #     current_df = pd.read_csv(csv_path)
 #     prev_path = os.path.join(BASE_DIR, "investing_topics_prev.csv")
-
 #     if os.path.exists(prev_path):
 #         previous_df = pd.read_csv(prev_path)
 #         changed_df = detect_changes(current_df, previous_df)
 #         if changed_df.empty:
-#
-#             progress_callback("β No changes detected. Skipping processing.")
+#             print("β No changes detected. Skipping processing.")
 #             return []
 #         else:
 #             changed_df = current_df
@@ -171,24 +158,20 @@ if __name__ == "__main__":
 #     for _, row in changed_df.iterrows():
 #         topic = row.get("topic")
 #         timespan = row.get("timespan_days", 7)
-
-#         if progress_callback:
-#             progress_callback(f"π Processing: {topic} ({timespan} days)")
+#         print(f"\nπ Processing: {topic} ({timespan} days)")
 
 #         news = fetch_deep_news(topic, timespan)
 #         if not news:
-#
-#             progress_callback(f"β οΈ No news found for: {topic}")
+#             print(f"β οΈ No news found for: {topic}")
 #             continue
 
-#         if progress_callback:
-#             progress_callback(f"π§ Analyzing news for: {topic}")
-
 #         report_body = generate_value_investor_report(topic, news)
+#         from image_search import search_unsplash_image
 
-#         #
-#         image_url =
-
+#         # Later inside your loop
+#         image_url, image_credit = search_unsplash_image(topic)
+
+#         #image_url, image_credit = search_unsplash_image(topic, os.getenv("OPENAI_API_KEY"))
 
 #         metrics_md = build_metrics_box(topic, len(news))
 #         full_md = metrics_md + report_body
@@ -203,39 +186,34 @@ if __name__ == "__main__":
 #         filepath = os.path.join(DATA_DIR, filename)
 #         counter += 1
 
-#         if progress_callback:
-#             progress_callback(f"π Saving markdown for: {topic}")
-
 #         with open(filepath, "w", encoding="utf-8") as f:
 #             f.write(full_md)
 
 #         new_md_files.append(filepath)
 
-#
-#         progress_callback(f"β Markdown reports saved to: `{DATA_DIR}`")
-
+#     print(f"β Markdown saved to: {DATA_DIR}")
 #     current_df.to_csv(prev_path, index=False)
 #     return new_md_files
 
-
+
+# def run_pipeline(csv_path, tavily_api_key):
 #     os.environ["TAVILY_API_KEY"] = tavily_api_key
 
-#     new_md_files = run_value_investing_analysis(csv_path
+#     new_md_files = run_value_investing_analysis(csv_path)
 #     new_html_paths = []
 
 #     for md_path in new_md_files:
-#         if progress_callback:
-#             progress_callback(f"π Converting to HTML: {os.path.basename(md_path)}")
-
 #         convert_md_to_html(md_path, HTML_DIR)
 #         html_path = os.path.join(HTML_DIR, os.path.basename(md_path).replace(".md", ".html"))
 #         new_html_paths.append(html_path)
 
 #     return new_html_paths
 
+
 # if __name__ == "__main__":
 #     md_files = run_value_investing_analysis(CSV_PATH)
 #     for md in md_files:
 #         convert_md_to_html(md, HTML_DIR)
 #         print(f"π All reports converted to HTML at: {HTML_DIR}")
 
+
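For context, the change above threads an optional progress_callback through run_value_investing_analysis and run_pipeline so a caller can receive status messages instead of only console prints. The following is a minimal usage sketch of that hook; the call site, CSV path, and logging callback are illustrative assumptions and not part of this commit.

# Usage sketch (hypothetical): driving the progress_callback hook added in this commit.
import os

from main import run_pipeline  # assumes src/ is on sys.path when running inside the Space


def log_progress(message: str) -> None:
    # Any one-argument callable works; a UI layer could append this to a status panel.
    print(message)


if __name__ == "__main__":
    # Placeholder path and key; substitute the real topics CSV and Tavily API key.
    reports = run_pipeline(
        csv_path=os.path.join("data", "investing_topics.csv"),
        tavily_api_key=os.environ.get("TAVILY_API_KEY", ""),
        progress_callback=log_progress,
    )
    print(f"Generated {len(reports)} HTML report(s)")

Because progress_callback defaults to None, existing callers keep working unchanged while interactive frontends can surface the same messages that are printed to the console.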