File size: 7,011 Bytes
e15f81c
3e74eb0
e7bd9fb
 
ad83944
424c4c2
a814e5a
 
 
 
 
 
 
143d77d
a814e5a
e7bd9fb
 
a814e5a
 
 
 
 
e7bd9fb
 
143d77d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a814e5a
 
 
e7bd9fb
a814e5a
 
 
 
 
 
33ee975
a814e5a
 
ad83944
a814e5a
 
 
 
 
143d77d
a814e5a
e7bd9fb
a814e5a
 
 
e7bd9fb
a814e5a
 
 
 
 
 
 
 
e7bd9fb
a814e5a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e7bd9fb
a814e5a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
143d77d
 
 
a814e5a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e7bd9fb
a814e5a
 
 
2b7f7bd
a814e5a
 
 
 
 
 
 
 
f9fdb45
e7bd9fb
a814e5a
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
import os
import streamlit as st
import requests
from transformers import pipeline
from typing import Dict
from together import Together
from utils import (
    img2txt, 
    txt2story, 
    txt2speech, 
    get_user_preferences, 
    send_story_email, 
    validate_email,
    validate_gmail_credentials
)

def main():
    st.set_page_config(
        page_title="🎨 Image-to-Audio Story 🎧",
        page_icon="πŸ–ΌοΈ",
        layout="wide"
    )
    st.title("Turn the Image into Audio Story")

    # Email Configuration in Sidebar
    st.sidebar.markdown("## πŸ“§ Email Configuration")
    with st.sidebar.expander("Configure Gmail Settings", expanded=not bool(os.getenv('SENDER_EMAIL'))):
        sender_email = st.text_input(
            "Gmail Address:",
            value=os.getenv('SENDER_EMAIL', ''),
            type="default",
            key="gmail"
        )
        sender_password = st.text_input(
            "App Password:",
            value=os.getenv('SENDER_PASSWORD', ''),
            type="password",
            key="password",
            help="Use an App Password from your Google Account settings"
        )
        
        if st.button("Save Configuration"):
            if not sender_email or not sender_password:
                st.error("Please provide both email and password.")
            elif not validate_email(sender_email):
                st.error("Please enter a valid Gmail address.")
            else:
                # Validate credentials
                error = validate_gmail_credentials(sender_email, sender_password)
                if error:
                    st.error(f"Failed to validate credentials: {error}")
                else:
                    # Save credentials to environment variables
                    os.environ['SENDER_EMAIL'] = sender_email
                    os.environ['SENDER_PASSWORD'] = sender_password
                    st.success("Email configuration saved successfully!")

    # LLM Parameters in sidebar
    st.sidebar.markdown("# βš™οΈ LLM Configuration")
    with st.sidebar.expander("Model Parameters", expanded=False):
        top_k = st.number_input("Top-K", min_value=1, max_value=100, value=5)
        top_p = st.number_input("Top-P", min_value=0.0, max_value=1.0, value=0.8)
        temperature = st.number_input("Temperature", min_value=0.1, max_value=2.0, value=1.5)

    # Main content area
    col1, col2 = st.columns([2, 3])

    with col1:
        # Image upload section
        st.markdown("## πŸ“· Upload Image")
        uploaded_file = st.file_uploader(
            "Choose an image...", 
            type=["jpg", "jpeg", "png"]
        )

        # Story preferences section
        st.markdown("## 🎭 Story Preferences")
        preferences = get_user_preferences()

    with col2:
        if uploaded_file is not None:
            # Display uploaded image
            st.markdown("## πŸ–ΌοΈ Your Image")
            bytes_data = uploaded_file.read()
            with open("uploaded_image.jpg", "wb") as file:
                file.write(bytes_data)
            st.image(uploaded_file, use_column_width=True)

            # Process image and generate story
            if st.button("🎨 Generate Story"):
                with st.spinner("πŸ€– AI is working its magic..."):
                    try:
                        # Get image description
                        scenario = img2txt("uploaded_image.jpg")
                        
                        # Create story prompt
                        prompt = f"""Based on the image description: '{scenario}', 
                        create a {preferences['genre']} story set in {preferences['setting']} 
                        in {preferences['continent']}. The story should have a {preferences['tone']} 
                        tone and explore the theme of {preferences['theme']}. The main conflict 
                        should be {preferences['conflict']}. The story should have a {preferences['twist']} 
                        and end with a {preferences['ending']} ending."""
                        
                        # Generate story
                        story = txt2story(prompt, top_k, top_p, temperature)
                        
                        # Convert to audio
                        txt2speech(story)

                        # Display results
                        st.markdown("---")
                        
                        # Image caption
                        with st.expander("πŸ“œ Image Caption", expanded=True):
                            st.write(scenario)
                        
                        # Story text
                        with st.expander("πŸ“– Generated Story", expanded=True):
                            st.write(story)
                        
                        # Audio player
                        with st.expander("🎧 Audio Version", expanded=True):
                            st.audio("audio_story.mp3")
                        
                        # Email section
                        if os.getenv('SENDER_EMAIL') and os.getenv('SENDER_PASSWORD'):
                            st.markdown("---")
                            st.markdown("## πŸ“§ Get Story via Email")
                            email = st.text_input(
                                "Enter your email address:",
                                help="We'll send you the story text and audio file"
                            )
                            
                            if st.button("πŸ“€ Send to Email"):
                                if not email:
                                    st.warning("Please enter an email address.")
                                elif not validate_email(email):
                                    st.error("Please enter a valid email address.")
                                else:
                                    with st.spinner("πŸ“¨ Sending email..."):
                                        if send_story_email(email, story, "audio_story.mp3"):
                                            st.success("βœ‰οΈ Story sent successfully! Check your email.")
                                        else:
                                            st.error("❌ Failed to send email. Please try again.")
                        else:
                            st.warning("⚠️ Please configure Gmail settings in the sidebar to enable email delivery.")

                    except Exception as e:
                        st.error(f"An error occurred: {str(e)}")
                        st.warning("Please try again or contact support if the problem persists.")

    # Footer
    st.markdown("---")
    st.markdown("### Credits")
    st.caption('''
        Made with ❀️ by @Aditya-Neural-Net-Ninja\n 
        Utilizes Image-to-Text model, Text Generation model, Google Text-to-Speech library\n
        Gratitude to Streamlit, πŸ€— Spaces for Deployment & Hosting
    ''')

if __name__ == '__main__':
    main()