import os import time from typing import List, Tuple, Optional import google.generativeai as genai import gradio as gr from PIL import Image print("google-generativeai:", genai.__version__) GOOGLE_API_KEY = os.environ.get("GOOGLE_API_KEY") TITLE = """

đŸ•šī¸ Google Gemini Chatbot đŸ”Ĩ

""" SUBTITLE = """

🎨 Create with Multimodal Gemini

""" DUPLICATE = """
Duplicate Space Duplicate the Space and run securely with your GOOGLE API KEY.
""" IMAGE_WIDTH = 512 def preprocess_stop_sequences(stop_sequences: str) -> Optional[List[str]]: return [seq.strip() for seq in stop_sequences.split(",")] if stop_sequences else None def preprocess_image(image: Image.Image) -> Image.Image: image_height = int(image.height * IMAGE_WIDTH / image.width) return image.resize((IMAGE_WIDTH, image_height)) def user(text_prompt: str, chatbot: List[Tuple[str, str]]): return "", chatbot + [[text_prompt, None]] def bot( google_key: str, image_prompt: Optional[Image.Image], text_prompt: str, temperature: float, max_output_tokens: int, stop_sequences: str, top_k: int, top_p: float, chatbot: List[Tuple[str, str]] ): google_key = google_key or GOOGLE_API_KEY if not google_key: raise ValueError("GOOGLE_API_KEY is not set. Please set it up.") genai.configure(api_key=google_key) instructions = "You are an expert stylist. You suggest and evaluate any style-related question to make anyone, regardless of gender, race, or any other demographic diversity, look stylish." model_name = 'gemini-pro-vision' if image_prompt else 'gemini-1.5-pro-latest' inputs = [text_prompt, instructions] if image_prompt: inputs.append(preprocess_image(image_prompt)) model = genai.GenerativeModel(model_name) response = model.generate_content(inputs, stream=True, generation_config=genai.types.GenerationConfig( temperature=temperature, max_output_tokens=max_output_tokens, stop_sequences=preprocess_stop_sequences(stop_sequences), top_k=top_k, top_p=top_p )) response.resolve() chatbot[-1][1] = "" for chunk in response: for i in range(0, len(chunk.text), 10): chatbot[-1][1] += chunk.text[i:i + 10] time.sleep(0.01) yield chatbot google_key_component = gr.Textbox( label="GOOGLE API KEY", type="password", placeholder="Enter your Google API Key", visible=GOOGLE_API_KEY is None ) image_prompt_component = gr.Image(type="pil", label="Upload Image", width=200) text_prompt_component = gr.Textbox( placeholder="Describe your style needs", label="Enter your prompt", width=300 ) run_button_component = gr.Button("Ask Stylist") user_inputs = [text_prompt_component, chatbot_component] bot_inputs = [google_key_component, image_prompt_component, text_prompt_component, temperature_component, max_output_tokens_component, stop_sequences_component, top_k_component, top_p_component, chatbot_component] with gr.Blocks() as demo: gr.HTML(TITLE) gr.HTML(SUBTITLE) gr.HTML(DUPLICATE) with gr.Row(): google_key_component.render() with gr.Row(): text_prompt_component.render() image_prompt_component.render() chatbot_component = gr.Chatbot(label='Gemini Personal Stylist') chatbot_component.render() run_button_component.render() run_button_component.click( fn=user, inputs=user_inputs, outputs=[text_prompt_component, chatbot_component], queue=False ).then( fn=bot, inputs=bot_inputs, outputs=[chatbot_component] ) text_prompt_component.submit( fn=user, inputs=user_inputs, outputs=[text_prompt_component, chatbot_component], queue=False ).then( fn=bot, inputs=bot_inputs, outputs=[chatbot_component] ) demo.launch()