Spaces:
Running
Running
import gradio as gr | |
import os | |
from huggingface_hub import InferenceClient | |
import random | |
from typing import Generator, Dict, List, Tuple, Optional | |
# The Hugging Face API token is read from the HF_TOKEN environment variable;
# it is None when the variable is not set.
hf_token = os.getenv("HF_TOKEN")

# Shared inference client used by respond() for every chat completion.
client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta", token=hf_token)
# Story genres mapped to their example starter prompts.
# Each entry must be separated by a comma: adjacent string literals without
# one are silently concatenated into a single string by Python.
GENRE_EXAMPLES = {
    "fairy_tale": [
        "I follow the shimmer of fairy dust into a hidden forest",
        "I meet a talking rabbit who claims to know a secret about the king’s lost crown",
        "A tiny dragon appears at my window, asking for help to find its mother",
        "I step into a clearing where the trees whisper ancient riddles",
        "A friendly witch invites me into her cozy cottage, offering a warm cup of tea",
    ],
    "fantasy": [
        "I enter the ancient forest seeking the wizard's tower",
        "I approach the dragon cautiously with my shield raised",
        "I examine the mysterious runes carved into the stone altar",
        "I try to bargain with the elven council for safe passage",
    ],
    "sci-fi": [
        "I hack into the space station's mainframe",
        "I investigate the strange signal coming from the abandoned planet",
        "I negotiate with the alien ambassador about the peace treaty",
        "I try to repair my damaged spacecraft before oxygen runs out",
    ],
    "mystery": [
        "I examine the crime scene for overlooked evidence",
        "I question the nervous butler about the night of the murder",
        "I follow the suspicious figure through the foggy streets",
        "I check the victim's diary for hidden clues",
    ],
    "horror": [
        "I slowly open the creaking door to the basement",
        "I read the forbidden text while the candles flicker",
        "I hide under the bed as footsteps approach",
        "I investigate the strange noises coming from the attic",
    ],
    "western": [
        "I challenge the outlaw to a duel at high noon",
        "I track the bandits through the desert canyon",
        "I enter the saloon looking for information",
        "I defend the stagecoach from the approaching raiders",
    ],
    "cyberpunk": [
        "I jack into the corporate mainframe to steal data",
        "I negotiate with the street gang for cybernetic upgrades",
        "I hide in the neon-lit alleyway from corporate security",
        "I meet my mysterious client in the underground bar",
    ],
    "historical": [
        "I attend the royal ball hoping to meet the mysterious count",
        "I join the resistance against the occupying forces",
        "I navigate the dangerous politics of the royal court",
        "I set sail on a voyage to discover new lands",
    ],
    "post-apocalyptic": [
        "I scavenge the abandoned shopping mall for supplies",
        "I approach the fortified settlement seeking shelter",
        "I navigate through the radioactive zone using my old map",
        "I hide from the approaching group of raiders",
    ],
    "steampunk": [
        "I pilot my airship through the lightning storm",
        "I present my new invention to the Royal Academy",
        "I investigate the mysterious clockwork automaton",
        "I sneak aboard the emperor's armored train",
    ],
}
# --- Tunable limits -------------------------------------------------------
# Conversation context.
MEMORY_WINDOW = 5  # most recent exchanges sent to the model (reduced from 10 to limit context)
MAX_HISTORY_LENGTH = 20  # NOTE(review): not referenced by the code visible in this file

# Text generation parameters passed to the chat completion call.
MAX_TOKENS = 1024  # reduced from 2048 for faster responses
TEMPERATURE = 0.7  # slightly reduced for faster convergence
TOP_P = 0.95

# Streaming: characters accumulated before partial output is first shown
# (reduced from 200 for quicker display).
MIN_RESPONSE_LENGTH = 100
def get_examples_for_genre(genre):
    """Return the starter prompts for ``genre``.

    Genres that are not keys of GENRE_EXAMPLES fall back to the "fantasy"
    prompts.
    """
    fallback_prompts = GENRE_EXAMPLES["fantasy"]
    return GENRE_EXAMPLES.get(genre, fallback_prompts)
def get_enhanced_system_prompt(genre=None):
    """Build the storyteller system prompt for the given genre.

    Args:
        genre: Genre name interpolated into the prompt. Any falsy value
            (None or an empty string) is replaced by "fantasy".

    Returns:
        The complete system prompt as a single string.
    """
    selected_genre = genre if genre else "fantasy"
    return f"""You are an interactive storyteller creating an immersive {selected_genre} choose-your-own-adventure story.
For each response you MUST:
1. Write 100-200 words describing the scene, using vivid sensory details
2. Always use second-person perspective ("you", "your") to maintain reader immersion
3. Include dialogue or your character's thoughts that reveal personality and motivations
4. Create a strong sense of atmosphere appropriate for {selected_genre}
5. End EVERY response with exactly three numbered choices like this:
1. [Complete sentence in second-person starting with a verb (e.g., "You decide to..."/"You attempt to...")]
2. [Complete sentence in second-person starting with a verb (e.g., "You sneak towards..."/"You call out to...")]
3. [Complete sentence in second-person starting with a verb (e.g., "You examine..."/"You reach for...")]
IMPORTANT:
- Always maintain second-person perspective throughout the narrative
- Always end with exactly three numbered choices
- Never skip the choices or respond with just narrative
- Each choice must start with "You" followed by a verb
- Format choices exactly as shown above with numbers 1-3
Keep the story cohesive by referencing previous events and choices."""
def create_story_summary(chat_history):
    """Return a system message asking the model to summarise the story so far.

    The function does not produce the summary itself; it only builds the
    instruction message that requests one.

    Args:
        chat_history: Sequence of past exchanges. Only its length is
            inspected, so the shape of the individual entries is irrelevant.

    Returns:
        None when the history holds two or fewer exchanges, otherwise a
        dict with "role" and "content" keys.
    """
    if len(chat_history) <= 2:
        return None

    # The previous implementation also concatenated every exchange into a
    # local string that was never used; that dead loop is gone, and with it
    # the unpacking error it raised for entries that are not 2-item pairs.
    return {
        "role": "system",
        "content": "The conversation history is getting long. Please create a brief summary of the key plot points and character development so far to help maintain context without exceeding token limits."
    }
def format_history_for_gradio(history_tuples):
    """Coerce every (user, bot) pair of the history into a pair of strings."""
    formatted = []
    for user_part, bot_part in history_tuples:
        formatted.append((str(user_part), str(bot_part)))
    return formatted
def respond(
    message: str,
    chat_history: List[Tuple[str, str]],
    genre: Optional[str] = None,
    use_full_memory: bool = True
) -> Generator[List[Tuple[str, str]], None, None]:
    """Stream the storyteller's reply to ``message`` as updated chat histories.

    Args:
        message: The player's latest input.
        chat_history: Previous (user, bot) exchanges. None is treated as an
            empty history. The list passed in is never mutated.
        genre: Genre forwarded to get_enhanced_system_prompt().
        use_full_memory: When true, the last MEMORY_WINDOW exchanges are sent
            to the model as context; when false, no past exchanges are sent.

    Yields:
        The history followed by one new (message, reply-so-far) pair. For a
        blank message the unchanged history is yielded once. If the request
        fails, the new pair carries an error text instead of a reply.
    """
    # Snapshot the history before anything can fail, so that every exit path
    # below (including the exception handler) has a valid list to extend.
    current_history = list(chat_history or [])

    # This function is a generator, so a plain `return value` would be
    # discarded by the caller; the unchanged history has to be yielded.
    if not message or not message.strip():
        yield current_history
        return

    # Build the API payload: system prompt, optional context, current message.
    formatted_messages = [
        {"role": "system", "content": get_enhanced_system_prompt(genre)}
    ]
    if use_full_memory:
        for user_msg, bot_msg in current_history[-MEMORY_WINDOW:]:
            formatted_messages.append({"role": "user", "content": str(user_msg)})
            formatted_messages.append({"role": "assistant", "content": str(bot_msg)})
    formatted_messages.append({"role": "user", "content": str(message)})

    bot_message = ""
    try:
        for response_chunk in client.chat_completion(
            formatted_messages,
            max_tokens=MAX_TOKENS,
            stream=True,
            temperature=TEMPERATURE,
            top_p=TOP_P
        ):
            # Skip chunks that carry no choices or no text.
            if not response_chunk.choices:
                continue
            delta = getattr(response_chunk.choices[0].delta, "content", None)
            if not delta:
                continue
            bot_message += delta
            # Hold back partial output until it reaches MIN_RESPONSE_LENGTH.
            if len(bot_message.strip()) >= MIN_RESPONSE_LENGTH:
                yield current_history + [(message, bot_message)]
        if bot_message:  # Ensure short replies and the final text are shown
            yield current_history + [(message, bot_message)]
    except Exception as e:
        # Boundary handler: surface the failure in the chat rather than
        # letting the event handler crash.
        error_message = f"Story magic temporarily interrupted. Please try again. (Error: {e})"
        yield current_history + [(message, error_message)]
def save_story(chat_history):
    """Render the chat history as a markdown document.

    Returns a placeholder sentence when the history is empty; otherwise a
    title followed by one Player/Story section per exchange, each closed by
    a horizontal rule.
    """
    if not chat_history:
        return "No story to save yet!"

    sections = ["# My Interactive Adventure\n\n"]
    for player_text, story_reply in chat_history:
        sections.append(f"**Player:** {player_text}\n\n")
        sections.append(f"**Story:** {story_reply}\n\n---\n\n")
    return "".join(sections)
with gr.Blocks(theme=gr.themes.Soft()) as demo:
    gr.Markdown("# 🔮 Interactive Story Time")
    with gr.Row():
        status_message = gr.Markdown("Ready to begin your adventure...", visible=True)
    gr.Markdown("Create a completely unique literary world, one choice at a time. Dare to explore the unknown.")

    with gr.Row():
        with gr.Column(scale=3):
            # Chat window + user input
            chatbot = gr.Chatbot(
                height=500,
                bubble_full_width=True,  # Allow bubbles to use full width
                show_copy_button=True,
                avatar_images=(None, "🧙"),
                # respond() and save_story() produce and consume (user, bot)
                # pairs, so the component has to use the tuple format too.
                type="tuples",
                container=True,
                scale=1,
                min_width=800,
            )
            msg = gr.Textbox(
                placeholder="Describe what you want to do next in the story...",
                container=False,
                scale=4,
            )
            with gr.Row():
                submit = gr.Button("Continue Story", variant="primary")
                clear = gr.Button("Start New Adventure")

        with gr.Column(scale=1):
            gr.Markdown("## Adventure Settings")
            genre = gr.Dropdown(
                choices=list(GENRE_EXAMPLES.keys()),
                label="Story Genre",
                info="Choose the theme of your next adventure",
                value="fantasy",
            )
            full_memory = gr.Checkbox(
                label="Full Story Memory",
                value=True,
                # Describes what respond() actually does with this flag.
                info=(
                    f"When enabled, the AI is given the most recent {MEMORY_WINDOW} "
                    "exchanges as context. If disabled, each reply is based only "
                    "on your latest message."
                ),
            )
            gr.Markdown("## Story Starters")
            # Four placeholder buttons; their labels are replaced on page
            # load and whenever the genre changes.
            starter_btn1 = gr.Button("Starter 1")
            starter_btn2 = gr.Button("Starter 2")
            starter_btn3 = gr.Button("Starter 3")
            starter_btn4 = gr.Button("Starter 4")
            starter_buttons = [starter_btn1, starter_btn2, starter_btn3, starter_btn4]

    def update_starter_buttons(selected_genre):
        """Return one label per starter button for the selected genre.

        Genres with fewer examples than buttons are padded with empty
        strings; surplus examples are ignored.
        """
        examples = get_examples_for_genre(selected_genre)
        return tuple(
            examples[i] if i < len(examples) else ""
            for i in range(len(starter_buttons))
        )

    # Labels for the default genre, applied by the load event below so the
    # buttons do not keep their "Starter X" placeholders.
    initial_button_data = update_starter_buttons("fantasy")  # tuple of 4 strings

    def pick_starter(starter_text, chat_history, selected_genre, memory_flag):
        """Return the chosen starter text unchanged (not wired to any event)."""
        return starter_text

    def start_story_from_starter(starter_text, chat_history, selected_genre, memory_flag):
        """Begin a new story from a starter prompt and stream the reply.

        The starter is shown immediately as the first user turn, then
        respond() runs against an empty history so the prompt is not added
        a second time. A blank starter leaves the chat untouched.
        """
        if not starter_text or not starter_text.strip():
            yield chat_history
            return
        yield [(starter_text, None)]
        yield from respond(starter_text, [], selected_genre, memory_flag)

    # A button used as an input passes its current label to the handler.
    for starter_button in starter_buttons:
        starter_button.click(
            fn=start_story_from_starter,
            inputs=[starter_button, chatbot, genre, full_memory],
            outputs=[chatbot],
            queue=True,
        )

    # Refresh the starter labels whenever the genre changes.
    genre.change(
        fn=update_starter_buttons,
        inputs=[genre],
        outputs=starter_buttons,
    )

    # Handlers for free-text input; the textbox is emptied once the reply
    # has finished streaming.
    msg.submit(respond, [msg, chatbot, genre, full_memory], [chatbot]).then(
        lambda: "", None, msg, queue=False
    )
    submit.click(respond, [msg, chatbot, genre, full_memory], [chatbot]).then(
        lambda: "", None, msg, queue=False
    )

    # Clear the chatbot and the textbox for a new adventure.
    clear.click(lambda: [], None, chatbot, queue=False)
    clear.click(lambda: "", None, msg, queue=False)

    # "Download My Story" row
    with gr.Row():
        save_btn = gr.Button("Download My Story", variant="secondary")
        # elem_id lets the scroll script below find this component.
        story_output = gr.Markdown(visible=False, elem_id="story_output")

    def show_saved_story(chat_history):
        """Fill the story panel with the markdown export and reveal it."""
        return gr.update(value=save_story(chat_history), visible=True)

    # A single handler writes the panel (two competing handlers used to
    # overwrite each other); scrolling runs only after the content is set.
    save_btn.click(
        fn=show_saved_story,
        inputs=[chatbot],
        outputs=[story_output],
    ).then(
        fn=None,
        inputs=None,
        outputs=None,
        js="() => { const el = document.getElementById('story_output'); if (el) { el.scrollIntoView(); } }",
    )

    def load_initial_buttons():
        """Return the precomputed starter labels for the default genre."""
        return initial_button_data

    # Apply the initial labels to the four starter buttons on page load.
    demo.load(fn=load_initial_buttons, outputs=starter_buttons, queue=False)

# Run the app
if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=7860)