Spaces:

adi-123
/

Image-to-Audio_Story_Generator

Running

App Files Community

adi-123 committed on Nov 1, 2024

Commit

a814e5a

verified ·

1 Parent(s): 2862b53

Update app.py

Browse files

Files changed (1) hide show

app.py +128 -51

app.py CHANGED Viewed

@@ -4,69 +4,146 @@ import requests
 from transformers import pipeline
 from typing import Dict
 from together import Together
-from utils import img2txt, txt2story, txt2speech, get_user_preferences
-# Main function
 def main():
-    st.set_page_config(page_title="🎨 Image-to-Audio Story 🎧", page_icon="🖼️")
     st.title("Turn the Image into Audio Story")
-    # Allows users to upload an image file
-    uploaded_file = st.file_uploader("# 📷 Upload an image...", type=["jpg", "jpeg", "png"])
-    # Parameters for LLM model (in the sidebar)
-    st.sidebar.markdown("# LLM Inference Configuration Parameters")
-    top_k = st.sidebar.number_input("Top-K", min_value=1, max_value=100, value=5)
-    top_p = st.sidebar.number_input("Top-P", min_value=0.0, max_value=1.0, value=0.8)
-    temperature = st.sidebar.number_input("Temperature", min_value=0.1, max_value=2.0, value=1.5)
-    # Get user preferences for the story
-    st.markdown("## Story Preferences")
-    preferences = get_user_preferences()
-    if uploaded_file is not None:
-        # Reads and saves uploaded image file
-        bytes_data = uploaded_file.read()
-        with open("uploaded_image.jpg", "wb") as file:
-            file.write(bytes_data)
-        st.image(uploaded_file, caption='🖼️ Uploaded Image', use_column_width=True)
-        # Initiates AI processing and story generation
-        with st.spinner("## 🤖 AI is at Work! "):
-            scenario = img2txt("uploaded_image.jpg")  # Extracts text from the image
-            # Modify the prompt to include user preferences
-            prompt = f"Based on the image description: '{scenario}', create a {preferences['genre']} story set in {preferences['setting']} in {preferences['continent']}. " \
-                     f"The story should have a {preferences['tone']} tone and explore the theme of {preferences['theme']}. " \
-                     f"The main conflict should be {preferences['conflict']}. " \
-                     f"The story should have a {preferences['twist']} and end with a {preferences['ending']} ending."
-            story = txt2story(prompt, top_k, top_p, temperature)  # Generates a story based on the image text, LLM params, and user preferences
-            txt2speech(story)  # Converts the story to audio
-            st.markdown("---")
-            st.markdown("## 📜 Image Caption")
-            st.write(scenario)
-            st.markdown("---")
-            st.markdown("## 📖 Story")
-            st.write(story)
-            st.markdown("---")
-            st.markdown("## 🎧 Audio Story")
-            st.audio("audio_story.mp3")
 if __name__ == '__main__':
-    main()
-# Credits
-st.markdown("### Credits")
-st.caption('''
-            Made with ❤️ by @Aditya-Neural-Net-Ninja\n
-            Utilizes Image-to-Text model, Text Generation model, Google Text-to-Speech libraary\n
-            Gratitude to Streamlit, 🤗 Spaces for Deployment & Hosting
-            ''')

 from transformers import pipeline
 from typing import Dict
 from together import Together
+from utils import (
+    img2txt,
+    txt2story,
+    txt2speech,
+    get_user_preferences,
+    send_story_email,
+    validate_email,
+    create_gmail_config
+)
 def main():
+    # Page configuration
+    st.set_page_config(
+        page_title="🎨 Image-to-Audio Story 🎧",
+        page_icon="🖼️",
+        layout="wide"
+    )
     st.title("Turn the Image into Audio Story")
+    # Check for Gmail configuration in sidebar
+    if not os.path.exists('pysnail.conf'):
+        st.sidebar.markdown("## 📧 Email Configuration")
+        with st.sidebar.expander("Configure Gmail Settings", expanded=True):
+            sender_email = st.text_input("Gmail Address:", type="default", key="gmail")
+            sender_password = st.text_input("App Password:", type="password", key="password")
+            if st.button("Save Configuration"):
+                if sender_email and sender_password:
+                    os.environ['SENDER_EMAIL'] = sender_email
+                    os.environ['SENDER_PASSWORD'] = sender_password
+                    create_gmail_config()
+                    st.success("Email configuration saved successfully!")
+                else:
+                    st.error("Please provide both email and password.")
+    # LLM Parameters in sidebar
+    st.sidebar.markdown("# ⚙️ LLM Configuration")
+    with st.sidebar.expander("Model Parameters", expanded=False):
+        top_k = st.number_input("Top-K", min_value=1, max_value=100, value=5)
+        top_p = st.number_input("Top-P", min_value=0.0, max_value=1.0, value=0.8)
+        temperature = st.number_input("Temperature", min_value=0.1, max_value=2.0, value=1.5)
+    # Main content area
+    col1, col2 = st.columns([2, 3])
+    with col1:
+        # Image upload section
+        st.markdown("## 📷 Upload Image")
+        uploaded_file = st.file_uploader(
+            "Choose an image...",
+            type=["jpg", "jpeg", "png"],
+            help="Upload an image to generate a story from"
+        )
+        # Story preferences section
+        st.markdown("## 🎭 Story Preferences")
+        preferences = get_user_preferences()
+    with col2:
+        if uploaded_file is not None:
+            # Display uploaded image
+            st.markdown("## 🖼️ Your Image")
+            bytes_data = uploaded_file.read()
+            with open("uploaded_image.jpg", "wb") as file:
+                file.write(bytes_data)
+            st.image(uploaded_file, use_column_width=True)
+            # Process image and generate story
+            if st.button("🎨 Generate Story"):
+                with st.spinner("🤖 AI is working its magic..."):
+                    try:
+                        # Get image description
+                        scenario = img2txt("uploaded_image.jpg")
+                        # Create story prompt
+                        prompt = f"""Based on the image description: '{scenario}',
+                        create a {preferences['genre']} story set in {preferences['setting']}
+                        in {preferences['continent']}. The story should have a {preferences['tone']}
+                        tone and explore the theme of {preferences['theme']}. The main conflict
+                        should be {preferences['conflict']}. The story should have a {preferences['twist']}
+                        and end with a {preferences['ending']} ending."""
+                        # Generate story
+                        story = txt2story(prompt, top_k, top_p, temperature)
+                        # Convert to audio
+                        txt2speech(story)
+                        # Display results
+                        st.markdown("---")
+                        # Image caption
+                        with st.expander("📜 Image Caption", expanded=True):
+                            st.write(scenario)
+                        # Story text
+                        with st.expander("📖 Generated Story", expanded=True):
+                            st.write(story)
+                        # Audio player
+                        with st.expander("🎧 Audio Version", expanded=True):
+                            st.audio("audio_story.mp3")
+                        # Email section
+                        st.markdown("---")
+                        st.markdown("## 📧 Get Story via Email")
+                        # Only show email input if configuration exists
+                        if os.path.exists('pysnail.conf'):
+                            email = st.text_input(
+                                "Enter your email address:",
+                                help="We'll send you the story text and audio file"
+                            )
+                            if st.button("📤 Send to Email"):
+                                if not email:
+                                    st.warning("Please enter an email address.")
+                                elif not validate_email(email):
+                                    st.error("Please enter a valid email address.")
+                                else:
+                                    with st.spinner("📨 Sending email..."):
+                                        if send_story_email(email, story, "audio_story.mp3"):
+                                            st.success("✉️ Story sent successfully! Check your email.")
+                                        else:
+                                            st.error("❌ Failed to send email. Please try again.")
+                        else:
+                            st.warning("⚠️ Please configure Gmail settings in the sidebar to enable email delivery.")
+                    except Exception as e:
+                        st.error(f"An error occurred: {str(e)}")
+                        st.warning("Please try again or contact support if the problem persists.")
+    # Footer
+    st.markdown("---")
+    st.markdown("### Credits")
+    st.caption('''
+        Made with ❤️ by @Aditya-Neural-Net-Ninja\n
+        Utilizes Image-to-Text model, Text Generation model, Google Text-to-Speech library\n
+        Gratitude to Streamlit, 🤗 Spaces for Deployment & Hosting
+    ''')
 if __name__ == '__main__':
+    main()