adi-123's picture
Update utils.py
2862b53 verified
raw
history blame
4.52 kB
import re
import os
import streamlit as st
import requests
from transformers import pipeline
from typing import Dict
from together import Together
from gtts import gTTS
from gmail_smtplib_micro import GmailSMTPLib, Email
# Image-to-text
def img2txt(url: str) -> str:
    """Generate a short caption for an image.

    Builds a Hugging Face ``image-to-text`` pipeline backed by
    ``Salesforce/blip-image-captioning-base`` on every call, runs it on
    ``url`` and returns the ``generated_text`` of the first result.

    Args:
        url: Image reference handed straight to the captioning pipeline.

    Returns:
        The generated caption (generation is capped at 20 new tokens).
    """
    print("Initializing captioning model...")
    captioner = pipeline(
        "image-to-text",
        model="Salesforce/blip-image-captioning-base",
    )

    print("Generating text from the image...")
    results = captioner(url, max_new_tokens=20)
    caption = results[0]["generated_text"]

    print(caption)
    return caption
# Text-to-story generation with LLM model
def txt2story(prompt: str, top_k: int, top_p: float, temperature: float) -> str:
    """Generate a short story (target: at most 250 words) from a prompt.

    Sends a system + user message pair to the Together chat-completions
    endpoint in streaming mode and concatenates the streamed text pieces.

    Args:
        prompt: Text the story should be based on.
        top_k: Top-k sampling parameter forwarded to the API.
        top_p: Nucleus sampling parameter forwarded to the API.
        temperature: Sampling temperature forwarded to the API.

    Returns:
        The full story text assembled from all streamed chunks.
    """
    # The API key is read from the environment on every call.
    client = Together(api_key=os.environ.get("TOGETHER_API_KEY"))

    # The 250-word limit is stated both in the system and the user message.
    system_prompt = (
        "As an experienced short story writer, write a meaningful story "
        "influenced by the provided prompt.\n"
        "Ensure the story does not exceed 250 words."
    )
    story_prompt = f"Write a short story of no more than 250 words based on the following prompt: {prompt}"

    stream = client.chat.completions.create(
        model="meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
        messages=[
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": story_prompt},
        ],
        top_k=top_k,
        top_p=top_p,
        temperature=temperature,
        stream=True,
    )

    pieces = []
    for chunk in stream:
        # Streamed events may carry no choices, or a delta whose content is
        # None (typically the closing event); concatenating None would raise
        # TypeError, so such chunks are skipped.
        if not chunk.choices:
            continue
        text = getattr(chunk.choices[0].delta, "content", None)
        if text:
            pieces.append(text)
    return "".join(pieces)
# Text-to-speech
def txt2speech(text: str) -> None:
    """Convert ``text`` to English speech with gTTS.

    The resulting audio is written to ``audio_story.mp3`` (relative to the
    current working directory); nothing is returned.

    Args:
        text: The text to be spoken.
    """
    print("Converting text to speech using gTTS...")
    # Synthesize and persist in one step.
    gTTS(text=text, lang='en').save("audio_story.mp3")
# Get user preferences for the story
def get_user_preferences() -> Dict[str, str]:
    """Render one Streamlit select box per story attribute.

    Returns:
        A dict mapping each preference key (``continent``, ``genre``,
        ``setting``, ``plot``, ``tone``, ``theme``, ``conflict``, ``twist``,
        ``ending``) to the value returned by its select box.
    """
    # (preference key, widget label, selectable options) in display order.
    choices = (
        ("continent", "Continent", ["North America", "Europe", "Asia", "Africa", "Australia"]),
        ("genre", "Genre", ["Science Fiction", "Fantasy", "Mystery", "Romance"]),
        ("setting", "Setting", ["Future", "Medieval times", "Modern day", "Alternate reality"]),
        ("plot", "Plot", ["Hero's journey", "Solving a mystery", "Love story", "Survival"]),
        ("tone", "Tone", ["Serious", "Light-hearted", "Humorous", "Dark"]),
        ("theme", "Theme", ["Self-discovery", "Redemption", "Love", "Justice"]),
        ("conflict", "Conflict Type", ["Person vs. Society", "Internal struggle", "Person vs. Nature", "Person vs. Person"]),
        ("twist", "Mystery/Twist", ["Plot twist", "Hidden identity", "Unexpected ally/enemy", "Time paradox"]),
        ("ending", "Ending", ["Happy", "Bittersweet", "Open-ended", "Tragic"]),
    )
    return {key: st.selectbox(label, options) for key, label, options in choices}
def create_gmail_config():
    """Write the Gmail credentials file ``pysnail.conf``.

    The file is written to the current working directory and is always
    (re)written, replacing any existing content. ``username`` and
    ``password`` are taken from the ``SENDER_EMAIL`` and ``SENDER_PASSWORD``
    environment variables; an unset variable yields an empty value.

    Because the file holds a password, it is created with owner-only
    permissions (0o600). The mode only takes effect when the file is newly
    created; permissions of an already existing file are left as they are.
    """
    config_content = (
        "[GMail]\n"
        f"username = {os.getenv('SENDER_EMAIL', '')}\n"
        f"password = {os.getenv('SENDER_PASSWORD', '')}\n"
    )
    # os.open lets us pass the permission bits at creation time, which the
    # built-in open() cannot do.
    fd = os.open('pysnail.conf', os.O_WRONLY | os.O_CREAT | os.O_TRUNC, 0o600)
    with os.fdopen(fd, 'w', encoding='utf-8') as f:
        f.write(config_content)
def send_story_email(recipient_email: str, story_text: str, audio_file_path: str) -> bool:
    """Email a generated story together with its audio file.

    Builds an ``Email`` whose body embeds ``story_text``, attaches the file
    at ``audio_file_path``, and sends it to ``recipient_email`` through
    ``GmailSMTPLib`` configured from ``pysnail.conf``. The config file is
    generated via ``create_gmail_config`` only when it is missing.

    Args:
        recipient_email: Address the message is sent to.
        story_text: Story text placed in the message body.
        audio_file_path: Path of the audio file to attach.

    Returns:
        True when sending completed without raising; False when any
        exception occurred (the error is printed, not re-raised).
    """
    try:
        message = Email(
            "Your Generated Story",
            f"Here's your generated story:\n{story_text}\nEnjoy!",
        )
        message.add_attachment(audio_file_path)

        # Credentials file is only generated on first use.
        config_missing = not os.path.exists('pysnail.conf')
        if config_missing:
            create_gmail_config()

        sender = GmailSMTPLib('pysnail.conf')
        sender.send_object(message, recipient_email)
    except Exception as err:
        print(f"Error sending email: {str(err)}")
        return False
    else:
        return True
def validate_email(email: str) -> bool:
    """Perform a basic syntactic check of an email address.

    The address must consist of one or more word characters, dots or
    hyphens, an ``@``, one or more word characters, dots or hyphens, a dot,
    and one or more word characters.

    Args:
        email: The address to check.

    Returns:
        True if the whole string matches the pattern, False otherwise.
    """
    pattern = r'[\w.-]+@[\w.-]+\.\w+'
    # fullmatch instead of match + '$': '$' also matches just before a
    # trailing newline, which would let "user@example.com\n" through.
    return re.fullmatch(pattern, email) is not None