Spaces:

Agents-MCP-Hackathon
/

Narrated_Slideshow_Generator

Running

App Files Files Community

cp557 committed on Jun 17

Commit

557cacf

verified ·

1 Parent(s): 7f8dde5

Update app.py

Browse files

Files changed (1) hide show

app.py +100 -29

app.py CHANGED Viewed

@@ -1,12 +1,10 @@
 #!/usr/bin/env python3
 """
 Launches a single page Gradio app that:
-1. Accepts a topic/question.
 2. Generates slide markdown + TTS for each slide.
 3. Lets the user page through slides and hear the narration.
-Requires: generate_slideshow.py in the same directory and a valid
-GEMINI_KEY in your environment.
 """
 import asyncio
@@ -30,6 +28,19 @@ custom_css = """
 .input-row {
     margin-bottom: 10px;
 }
 .demo-row {
     margin-bottom: 20px;
     display: flex;
@@ -122,11 +133,14 @@ function animateSlideTransition() {
 }
 """
-async def generate_presentation_async(topic: str, session_id=None):
     """Async version: Generate slides, audio, and images for all slides; initialise UI with slide 0."""
     topic = (topic or "").strip()
-    # Empty topic check is now handled in _run_with_new_session
-    # Notification is shown from the button click handler
     # Create or get a session ID
     if session_id is None:
@@ -137,8 +151,8 @@ async def generate_presentation_async(topic: str, session_id=None):
         active_sessions[session_id] = {}
         active_sessions[session_id]["temp_dir"] = tempfile.mkdtemp(prefix=f"gradio_session_{session_id}_")
-    # Call the async version with the session ID
-    slides, audio_files, slide_images = await generate_slideshow_with_audio_async(topic, session_id=session_id)
     # Basic sanity - keep list lengths aligned for audio
     if len(audio_files) < len(slides):
@@ -160,10 +174,10 @@ async def generate_presentation_async(topic: str, session_id=None):
     return slides, audio_files, slide_images, 0, slides[0], audio_files[0], initial_image, progress_text, session_id
-def generate_presentation(topic: str, session_id=None):
     """Synchronous wrapper for the async presentation generator."""
     # Run the async function and handle empty topic case
-    return asyncio.run(generate_presentation_async(topic, session_id=session_id))
 def next_slide(slides, audio, images, idx, session_id):
@@ -306,10 +320,14 @@ atexit.register(cleanup_all_sessions)
 dino_audio_cache = {}
 dino_image_cache = {}
-def load_rise_fall_slideshow():
     """Load cached dinosaur slideshow demo and hide the demo button and instruction."""
     global dino_audio_cache, dino_image_cache
     # Clear any previous cache
     dino_audio_cache = {}
     dino_image_cache = {}
@@ -420,6 +438,22 @@ with gr.Blocks(
     )
     with gr.Column(elem_classes="container"):
         # First row for topic and generate button - increased horizontal width
         with gr.Row(elem_classes="input-row"):
             topic_box = gr.Textbox(
@@ -460,7 +494,7 @@ with gr.Blocks(
     session_state = gr.State(None)
     # Wiring
-    def prepare_for_generation(topic, session_id):
         """First step: clear the view and prepare for generation"""
         # First check if the topic is empty
         if not (topic or "").strip():
@@ -475,9 +509,34 @@ with gr.Blocks(
                 False  # should_generate
             )
         # Validate the topic using the Gemini Flash input guard
-        if not validate_topic(topic):
-            gr.Info("Please enter a valid topic or question.")
             return (
                 [], [], [], 0, "", None, None, "", session_id,
                 gr.update(visible=True),  # Show topic box
@@ -501,7 +560,7 @@ with gr.Blocks(
             True  # should_generate
         )
-    def _run_with_new_session(topic, session_id, should_generate):
         """Second step: actually generate the slideshow"""
         if not should_generate:
             # This case should ideally not be hit if UI updates from prepare_for_generation are correct
@@ -516,15 +575,27 @@ with gr.Blocks(
                 False # should_generate (though this output isn't strictly used here, keeping tuple size consistent)
             )
-        results = generate_presentation(topic, session_id)
-        return (*results,
-                gr.update(visible=False),
-                gr.update(visible=False),
-                gr.update(value="Generate", interactive=True),
-                gr.update(visible=False),
-                gr.update(visible=False),
-                True # should_generate (maintaining tuple size, actual value less critical here)
-               )
     # Two-step process for generation
     # 1. First clear the UI & validate
@@ -532,7 +603,7 @@ with gr.Blocks(
     gen_btn.click(
         prepare_for_generation,
-        inputs=[topic_box, session_state],
         outputs=[
             slides_state,
             audio_state,
@@ -552,7 +623,7 @@ with gr.Blocks(
         ]
     ).then(  # 2. Then (conditionally) generate the slideshow
         _run_with_new_session,
-        inputs=[topic_box, session_state, should_generate_state],
         outputs=[
             slides_state,
             audio_state,
@@ -587,11 +658,11 @@ with gr.Blocks(
     # Load cached demo slideshow
     demo_btn.click(
         load_rise_fall_slideshow,
-        inputs=[],
         outputs=[slides_state, audio_state, images_state, index_state, slide_markdown, audio_player, title_image,
                progress_indicator, session_state, demo_btn, demo_instruction],
     )
 if __name__ == "__main__":
-    demo.launch()

 #!/usr/bin/env python3
 """
 Launches a single page Gradio app that:
+1. Accepts a topic/question and Gemini API key.
 2. Generates slide markdown + TTS for each slide.
 3. Lets the user page through slides and hear the narration.
+Requires: generate_slideshow.py in the same directory
 """
 import asyncio
 .input-row {
     margin-bottom: 10px;
 }
+.api-key-section {
+    margin-bottom: 20px;
+    padding: 15px;
+    border: 1px solid #ddd;
+    border-radius: 8px;
+    background-color: #f9f9f9;
+}
+.api-key-note {
+    font-size: 0.9em;
+    color: #666;
+    margin-top: 5px;
+    line-height: 1.5;
+}
 .demo-row {
     margin-bottom: 20px;
     display: flex;
 }
 """
+async def generate_presentation_async(topic: str, api_key: str, session_id=None):
     """Async version: Generate slides, audio, and images for all slides; initialise UI with slide 0."""
     topic = (topic or "").strip()
+    api_key = (api_key or "").strip()
+    # Validate API key
+    if not api_key:
+        raise gr.Error("Please enter your Gemini API key")
     # Create or get a session ID
     if session_id is None:
         active_sessions[session_id] = {}
         active_sessions[session_id]["temp_dir"] = tempfile.mkdtemp(prefix=f"gradio_session_{session_id}_")
+    # Call the async version with the session ID and API key
+    slides, audio_files, slide_images = await generate_slideshow_with_audio_async(topic, api_key, session_id=session_id)
     # Basic sanity - keep list lengths aligned for audio
     if len(audio_files) < len(slides):
     return slides, audio_files, slide_images, 0, slides[0], audio_files[0], initial_image, progress_text, session_id
+def generate_presentation(topic: str, api_key: str, session_id=None):
     """Synchronous wrapper for the async presentation generator."""
     # Run the async function and handle empty topic case
+    return asyncio.run(generate_presentation_async(topic, api_key, session_id=session_id))
 def next_slide(slides, audio, images, idx, session_id):
 dino_audio_cache = {}
 dino_image_cache = {}
+def load_rise_fall_slideshow(api_key):
     """Load cached dinosaur slideshow demo and hide the demo button and instruction."""
     global dino_audio_cache, dino_image_cache
+    # API key is required even for demo
+    if not api_key:
+        raise gr.Error("Please enter your Gemini API key first")
     # Clear any previous cache
     dino_audio_cache = {}
     dino_image_cache = {}
     )
     with gr.Column(elem_classes="container"):
+        # API Key section
+        with gr.Group(elem_classes="api-key-section"):
+            api_key_input = gr.Textbox(
+                label="Gemini API Key",
+                placeholder="Enter your Gemini API key here",
+                type="password",
+                scale=1
+            )
+            gr.HTML(
+                """<div class="api-key-note">
+                    <strong>Note:</strong> You need a Gemini API key with billing enabled to use this app.<br>
+                    Get your API key from <a href="https://aistudio.google.com/app/apikey" target="_blank">Google AI Studio</a>.<br>
+                    <em>Important: Make sure to enable billing on your Google Cloud account for API access.</em>
+                </div>"""
+            )
         # First row for topic and generate button - increased horizontal width
         with gr.Row(elem_classes="input-row"):
             topic_box = gr.Textbox(
     session_state = gr.State(None)
     # Wiring
+    def prepare_for_generation(topic, api_key, session_id):
         """First step: clear the view and prepare for generation"""
         # First check if the topic is empty
         if not (topic or "").strip():
                 False  # should_generate
             )
+        # Check if API key is provided
+        if not (api_key or "").strip():
+            gr.Info("Please enter your Gemini API key.")
+            return (
+                [], [], [], 0, "", None, None, "", session_id,
+                gr.update(visible=True),  # Show topic box
+                gr.update(visible=True),  # Show generate button
+                gr.update(value="Generate", interactive=True),  # Reset button state
+                gr.update(visible=True),  # Show dinosaur button
+                gr.update(visible=True),  # Show instruction
+                False  # should_generate
+            )
         # Validate the topic using the Gemini Flash input guard
+        try:
+            if not validate_topic(topic, api_key):
+                gr.Info("Please enter a valid topic or question.")
+                return (
+                    [], [], [], 0, "", None, None, "", session_id,
+                    gr.update(visible=True),  # Show topic box
+                    gr.update(visible=True),  # Show generate button
+                    gr.update(value="Generate", interactive=True),  # Reset button state
+                    gr.update(visible=True),  # Show dinosaur button
+                    gr.update(visible=True),  # Show instruction
+                    False  # should_generate
+                )
+        except Exception as e:
+            gr.Error(f"Error validating topic: {str(e)}. Please check your API key.")
             return (
                 [], [], [], 0, "", None, None, "", session_id,
                 gr.update(visible=True),  # Show topic box
             True  # should_generate
         )
+    def _run_with_new_session(topic, api_key, session_id, should_generate):
         """Second step: actually generate the slideshow"""
         if not should_generate:
             # This case should ideally not be hit if UI updates from prepare_for_generation are correct
                 False # should_generate (though this output isn't strictly used here, keeping tuple size consistent)
             )
+        try:
+            results = generate_presentation(topic, api_key, session_id)
+            return (*results,
+                    gr.update(visible=False),
+                    gr.update(visible=False),
+                    gr.update(value="Generate", interactive=True),
+                    gr.update(visible=False),
+                    gr.update(visible=False),
+                    True # should_generate (maintaining tuple size, actual value less critical here)
+                   )
+        except Exception as e:
+            gr.Error(f"Error generating slideshow: {str(e)}")
+            return (
+                [], [], [], 0, "Error generating slideshow. Please check your API key and try again.", None, None, "", session_id,
+                gr.update(visible=True),
+                gr.update(visible=True),
+                gr.update(value="Generate", interactive=True),
+                gr.update(visible=True),
+                gr.update(visible=True),
+                False
+            )
     # Two-step process for generation
     # 1. First clear the UI & validate
     gen_btn.click(
         prepare_for_generation,
+        inputs=[topic_box, api_key_input, session_state],
         outputs=[
             slides_state,
             audio_state,
         ]
     ).then(  # 2. Then (conditionally) generate the slideshow
         _run_with_new_session,
+        inputs=[topic_box, api_key_input, session_state, should_generate_state],
         outputs=[
             slides_state,
             audio_state,
     # Load cached demo slideshow
     demo_btn.click(
         load_rise_fall_slideshow,
+        inputs=[api_key_input],
         outputs=[slides_state, audio_state, images_state, index_state, slide_markdown, audio_player, title_image,
                progress_indicator, session_state, demo_btn, demo_instruction],
     )
 if __name__ == "__main__":
+    demo.launch()