Update app.py
app.py CHANGED
@@ -10,11 +10,11 @@ from io import BytesIO
@@ -24,83 +24,83 @@ def save_binary_file(file_name, data):
@@ -123,145 +123,134 @@ def generate_with_images(prompt, images):
@@ -269,13 +258,13 @@ with gr.Blocks() as demo:
@@ -283,8 +272,8 @@ with gr.Blocks() as demo:
@@ -294,15 +283,14 @@ with gr.Blocks() as demo:

The lines removed in these hunks were the previous Korean-language comments, docstrings, prompt strings, and UI labels (for example the submit button label "이미지 생성" and the prompt display label "사용된 프롬프트"). The updated file below shows their English replacements: added lines are prefixed with "+", unchanged context lines carry no prefix, and omitted unchanged ranges are noted in brackets.
  from google import genai
  from google.genai import types

+ # Load environment variables
  from dotenv import load_dotenv
  load_dotenv()

+ # Logging configuration
  logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
  logger = logging.getLogger(__name__)

[lines 21-23 unchanged]
  def preprocess_prompt(prompt, image1, image2, image3):
      """
+     Process the prompt and interpret function commands.
      """
+     # Check for image existence
      has_img1 = image1 is not None
      has_img2 = image2 is not None
      has_img3 = image3 is not None

+     # Replace #1, #2, #3 with description (if image is missing, note it)
      if "#1" in prompt:
+         prompt = prompt.replace("#1", "first image" if has_img1 else "first image (none)")
      if "#2" in prompt:
+         prompt = prompt.replace("#2", "second image" if has_img2 else "second image (none)")
      if "#3" in prompt:
+         prompt = prompt.replace("#3", "third image" if has_img3 else "third image (none)")

+     # Interpret function commands
+     if "1. Change Image" in prompt:
+         desc_match = re.search(r'#1 to "(.*?)"', prompt)
          if desc_match:
              description = desc_match.group(1)
+             prompt = f"Please change the first image to {description}. Reinterpret it with a new style and mood while preserving its main content."
          else:
+             prompt = "Please creatively transform the first image into a more vivid and artistic version."

+     elif "2. Remove Text" in prompt:
+         text_match = re.search(r'remove "(.*?)" from #1', prompt)
          if text_match:
              text_to_remove = text_match.group(1)
+             prompt = f"Please find and naturally remove the text '{text_to_remove}' from the first image, filling the area with a harmonious background."
          else:
+             prompt = "Please naturally remove all text from the first image to create a clean look."

+     elif "3. Replace Face" in prompt:
+         prompt = "Please seamlessly replace the face in the first image with the face from the second image. Follow the expression and features of the second image while keeping the rest of the first image intact."

+     elif "4. Change Outfit" in prompt:
+         if "#3" in prompt or "or #3" in prompt:
+             prompt = "Please seamlessly change the outfit in the first image to the outfit from the second or third image. Follow the style and color of the referenced image while maintaining the body proportions and pose of the first image."
          else:
+             prompt = "Please seamlessly change the outfit in the first image to the outfit from the second image. Follow the style and color of the second image while maintaining the body proportions and pose of the first image."

+     elif "5. Change Background" in prompt:
+         prompt = "Please seamlessly replace the background of the first image with the background from the second image, keeping the main subject intact and harmoniously merging with the new background."

+     elif "6. Blend Images (with product)" in prompt:
+         if "#3" in prompt or "or #3" in prompt:
+             prompt = "Please seamlessly blend the first, second, and third images into one image, ensuring that all key elements are included, especially the product."
          else:
+             prompt = "Please seamlessly blend the first and second images into one image, ensuring that all key elements are included, especially the product."

+     elif "7. Apply Style" in prompt:
+         prompt = "Please transform the content of the first image into the style of the second image, preserving its main subject and composition while applying the artistic style, colors, and texture of the second image."

+     elif "change to red" in prompt:
+         prompt = "Please change the first image to a red tone. Adjust the overall colors to red hues while maintaining a natural look."

+     prompt += " Please generate the image."
      return prompt
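For illustration, a rough sketch of how the placeholder replacement above behaves (hypothetical inputs, not part of the commit; img_a and img_b stand for already-loaded PIL images):

    # Hypothetical example of the placeholder handling in preprocess_prompt
    preprocess_prompt("blend #1 with #2", img_a, img_b, None)
    # -> 'blend first image with second image Please generate the image.'
    preprocess_prompt("blend #1 with #3", img_a, None, None)
    # -> 'blend first image with third image (none) Please generate the image.'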
  def generate_with_images(prompt, images):
      """
+     Generate an image via the API call.
      """
      try:
          api_key = os.environ.get("GEMINI_API_KEY")
          if not api_key:
+             return None, "API key is not set. Please check your environment variables."

          client = genai.Client(api_key=api_key)
+         logger.info(f"Starting Gemini API request - Prompt: {prompt}")

          contents = []
          contents.append(prompt)
          for idx, img in enumerate(images, 1):
              if img is not None:
                  contents.append(img)
+                 logger.info(f"Added image #{idx}")

          response = client.models.generate_content(
              model="gemini-2.0-flash-exp-image-generation",

[lines 107-122 unchanged]

          for part in response.candidates[0].content.parts:
              if hasattr(part, 'text') and part.text:
                  result_text += part.text
+                 logger.info(f"Response text: {part.text}")
              elif hasattr(part, 'inline_data') and part.inline_data:
                  save_binary_file(temp_path, part.inline_data.data)
                  image_found = True
+                 logger.info("Successfully extracted image from response")

          if not image_found:
+             return None, f"API did not generate an image. Response text: {result_text}"

          result_img = Image.open(temp_path)
          if result_img.mode == "RGBA":
              result_img = result_img.convert("RGB")

+         return result_img, f"Image successfully generated. {result_text}"

      except Exception as e:
+         logger.exception("Error occurred during image generation:")
+         return None, f"Error occurred: {str(e)}"
def process_images_with_prompt(image1, image2, image3, prompt):
|
146 |
"""
|
147 |
+
Process three images and a prompt.
|
148 |
+
Generates an image based on the prompt even if no images are uploaded,
|
149 |
+
and retries up to 3 times if generation fails.
|
150 |
"""
|
151 |
try:
|
152 |
images = [image1, image2, image3]
|
153 |
+
valid_images = [img for img in images if img is not None]
|
154 |
|
|
|
155 |
if not prompt or not prompt.strip():
|
156 |
if len(valid_images) == 0:
|
157 |
+
prompt = "Please creatively generate an image based on this prompt."
|
158 |
+
logger.info("Automatically generated text-only prompt")
|
159 |
elif len(valid_images) == 1:
|
160 |
+
prompt = "Please creatively transform this image into a more vivid and artistic version."
|
161 |
+
logger.info("Automatically generated single image prompt")
|
162 |
elif len(valid_images) == 2:
|
163 |
+
prompt = "Please seamlessly blend these two images into one, integrating the elements harmoniously."
|
164 |
+
logger.info("Automatically generated two-image blending prompt")
|
165 |
else:
|
166 |
+
prompt = "Please creatively blend these three images into one cohesive scene, including all main elements."
|
167 |
+
logger.info("Automatically generated three-image blending prompt")
|
168 |
else:
|
169 |
prompt = preprocess_prompt(prompt, image1, image2, image3)
|
170 |
|
|
|
171 |
max_retries = 3
|
172 |
for attempt in range(max_retries):
|
173 |
result_img, status = generate_with_images(prompt, valid_images)
|
174 |
if result_img is not None:
|
175 |
return result_img, status
|
176 |
else:
|
177 |
+
logger.info(f"Image generation failed, retrying ({attempt+1}/{max_retries})")
|
178 |
+
return None, f"Failed to generate image. Last status: {status}"
|
179 |
|
180 |
except Exception as e:
|
181 |
+
logger.exception("Error occurred during image processing:")
|
182 |
+
return None, f"Error occurred: {str(e)}"
|
183 |
|
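As a sketch of the automatic prompt fallback above (hypothetical call; an actual generation also requires GEMINI_API_KEY to be set):

    # With two uploaded images and an empty prompt, the two-image blending prompt is used
    result_img, status = process_images_with_prompt(img_a, img_b, None, "")
    # prompt passed to generate_with_images:
    # "Please seamlessly blend these two images into one, integrating the elements harmoniously."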
  def update_prompt_from_function(function_choice):
      """
+     Returns a prompt template based on the selected function.
+     (Custom text input has been removed.)
      """
      function_templates = {
+         "1. Change Image": '#1 to "desired description"',
+         "2. Remove Text": 'remove "text to remove" from #1',
+         "3. Replace Face": "replace the face in #1 with the face from #2",
+         "4. Change Outfit": "change the outfit in #1 to that from #2 or #3",
+         "5. Change Background": "change the background of #1 to the background from #2",
+         "6. Blend Images (with product)": "blend #1 with #2 or #3",
+         "7. Apply Style": "apply the style of #2 to #1"
      }

      return function_templates.get(function_choice, "")
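For example, selecting a dropdown entry simply fills the prompt box with the matching template:

    update_prompt_from_function("6. Blend Images (with product)")
    # -> 'blend #1 with #2 or #3'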
+ # Gradio Interface
  with gr.Blocks() as demo:
      gr.HTML(
          """
          <div style="text-align: center; margin-bottom: 1rem;">
+             <h1>Simple Image Generator</h1>
+             <p>You can generate an image by entering only a prompt. Alternatively, you can select a function below.</p>
          </div>
          """
      )

      with gr.Row():
          with gr.Column():
              with gr.Row():
                  image1_input = gr.Image(type="pil", label="#1", image_mode="RGB")
                  image2_input = gr.Image(type="pil", label="#2", image_mode="RGB")
                  image3_input = gr.Image(type="pil", label="#3", image_mode="RGB")

              function_dropdown = gr.Dropdown(
                  choices=[
+                     "1. Change Image",
+                     "2. Remove Text",
+                     "3. Replace Face",
+                     "4. Change Outfit",
+                     "5. Change Background",
+                     "6. Blend Images (with product)",
+                     "7. Apply Style"
                  ],
+                 label="Select Function",
                  value=None
              )

              prompt_input = gr.Textbox(
                  lines=3,
+                 placeholder="Enter a prompt or leave blank for automatic generation.",
+                 label="Prompt (optional)"
              )

+             submit_btn = gr.Button("Generate Image", variant="primary")

          with gr.Column():
+             output_image = gr.Image(label="Generated Image")
+             output_text = gr.Textbox(label="Status Message")
+             prompt_display = gr.Textbox(label="Used Prompt", visible=True)

+     # Update prompt textbox when function is selected
      function_dropdown.change(
          fn=update_prompt_from_function,
          inputs=[function_dropdown],
          outputs=[prompt_input]
      )

      def process_and_show_prompt(image1, image2, image3, prompt):
          images = [image1, image2, image3]
          valid_images = [img for img in images if img is not None]

[line 257 unchanged]

              auto_prompt = prompt
              if not prompt or not prompt.strip():
                  if len(valid_images) == 0:
+                     auto_prompt = "Please creatively generate an image based on this prompt."
                  elif len(valid_images) == 1:
+                     auto_prompt = "Please creatively transform this image into a more vivid and artistic version."
                  elif len(valid_images) == 2:
+                     auto_prompt = "Please seamlessly blend these two images into one, integrating the elements harmoniously."
                  else:
+                     auto_prompt = "Please creatively blend these three images into one cohesive scene, including all main elements."
              else:
                  auto_prompt = preprocess_prompt(prompt, image1, image2, image3)

[line 271 unchanged]

              return result_img, status, auto_prompt
          except Exception as e:
+             logger.exception("Error occurred during processing:")
+             return None, f"Error occurred: {str(e)}", prompt

      submit_btn.click(
          fn=process_and_show_prompt,
[lines 280-282 unchanged]

      gr.Markdown(
          """
+         ### Usage:

+         1. **Text-Only Generation:** Generate an image without uploading any image by simply entering a prompt.
+         2. **Select Function:** Choose a function from the dropdown and the corresponding template will automatically apply to the prompt.
+         3. **Image Upload:** Upload one or more images to apply the function accordingly.
+         4. **Automatic Retry:** If image generation fails, it will automatically retry up to 2 additional times.
          """
      )

  if __name__ == "__main__":
      demo.launch(share=True)
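To see the whole flow outside the Gradio UI, a minimal end-to-end sketch (hypothetical file names, not part of the commit; assumes GEMINI_API_KEY is available via the .env file loaded by load_dotenv and that the packages imported by app.py are installed):

    from PIL import Image

    img_content = Image.open("content.jpg")   # hypothetical input files
    img_style = Image.open("style.jpg")
    prompt = update_prompt_from_function("7. Apply Style")   # 'apply the style of #2 to #1'
    result_img, status = process_images_with_prompt(img_content, img_style, None, prompt)
    print(status)
    if result_img is not None:
        result_img.save("styled.jpg")   # hypothetical output path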