Update app.py
app.py CHANGED
@@ -12,45 +12,41 @@ import logging
 from google import genai
 from google.genai import types
 
-#
-from dotenv import load_dotenv
-load_dotenv()
-
-# Logging setup (log level: DEBUG)
+# Configure logging
 logging.basicConfig(level=logging.DEBUG,
                     format='%(asctime)s - %(levelname)s - %(message)s')
 logger = logging.getLogger(__name__)
 
 
 def save_binary_file(file_name, data):
-    logger.debug(f"
+    logger.debug(f"Saving binary data to file: {file_name}")
     with open(file_name, "wb") as f:
         f.write(data)
-    logger.debug(f"
+    logger.debug(f"File saved successfully: {file_name}")
 
 
-def generate(text, file_name, model="gemini-2.0-flash-exp-image-generation"):
-    logger.debug(f"generate
+def generate(text, file_name, api_key, model="gemini-2.0-flash-exp-image-generation"):
+    logger.debug(f"Starting generate function with text: '{text}', file_name: '{file_name}', model: '{model}'")
 
     try:
-        #
-        effective_api_key = os.environ.get("GEMINI_API_KEY")
-        if
-
-
-            logger.error("API
-            raise ValueError("API
+        # Initialize client
+        effective_api_key = api_key.strip() if api_key and api_key.strip() != "" else os.environ.get("GEMINI_API_KEY")
+        logger.debug(f"Using API Key: {'Provided' if api_key.strip() else 'From Environment Variable'}")
+
+        if not effective_api_key:
+            logger.error("No API key provided or found in environment variable.")
+            raise ValueError("API key is required.")
 
         client = genai.Client(api_key=effective_api_key)
-        logger.debug("Gemini
+        logger.debug("Gemini client initialized.")
+
 
-        # Upload the file
         files = [
             client.files.upload(file=file_name),
         ]
-        logger.debug(f"
+        logger.debug(f"File uploaded. URI: {files[0].uri}, MIME Type: {files[0].mime_type}")
+
 
-        # Build the content object: include the file URI together with the text prompt
         contents = [
             types.Content(
                 role="user",
@@ -63,7 +59,7 @@ def generate(text, file_name, model="gemini-2.0-flash-exp-image-generation"):
                 ],
             ),
         ]
-        logger.debug(f"
+        logger.debug(f"Content object created: {contents}")
 
         generate_content_config = types.GenerateContentConfig(
             temperature=1,
@@ -76,11 +72,11 @@ def generate(text, file_name, model="gemini-2.0-flash-exp-image-generation"):
             ],
             response_mime_type="text/plain",
         )
-        logger.debug(f"
+        logger.debug(f"Generate content config: {generate_content_config}")
 
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             temp_path = tmp.name
-        logger.debug(f"
+        logger.debug(f"Temporary file created: {temp_path}")
 
         response_stream = client.models.generate_content_stream(
             model=model,
@@ -88,106 +84,117 @@ def generate(text, file_name, model="gemini-2.0-flash-exp-image-generation"):
             config=generate_content_config,
         )
 
-        logger.debug("
+        logger.debug("Starting to process response stream...")
         for chunk in response_stream:
             if not chunk.candidates or not chunk.candidates[0].content or not chunk.candidates[0].content.parts:
-                logger.warning("
+                logger.warning("Chunk has no candidates, content, or parts. Skipping.")
                 continue
 
             inline_data = chunk.candidates[0].content.parts[0].inline_data
             if inline_data:
                 save_binary_file(temp_path, inline_data.data)
-                logger.info(f"
+                logger.info(f"File of mime type {inline_data.mime_type} saved to: {temp_path} and prompt input :{text}")
             else:
-                logger.info(f"
-                print(chunk.text)
+                logger.info(f"Received text: {chunk.text}")
+                print(chunk.text) # Keep the print for immediate console output
 
+            # Log the raw chunk for deeper inspection
             logger.debug(f"Raw chunk: {chunk}")
 
         del files
-        logger.debug("
+        logger.debug("Uploaded files deleted.")
         return temp_path
 
     except Exception as e:
-        logger.exception("
-        return None
+        logger.exception("An error occurred during generation:") # This will log the full traceback
+        return None # Return None when error happens
 
 
-def process_image_and_prompt(composite_pil, prompt):
-    logger.debug(f"process_image_and_prompt
+def process_image_and_prompt(composite_pil, prompt, gemini_api_key):
+    logger.debug(f"Starting process_image_and_prompt with prompt: '{prompt}'")
     try:
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             composite_path = tmp.name
             composite_pil.save(composite_path)
-        logger.debug(f"
+        logger.debug(f"Composite image saved to: {composite_path}")
 
         file_name = composite_path
        input_text = prompt
-        model = "gemini-2.0-flash-exp-image-generation"
+        model = "gemini-2.0-flash-exp-image-generation" # Consider changing this to "gemini-pro-vision"
 
-        gemma_edited_image_path = generate(text=input_text, file_name=file_name, model=model)
+        gemma_edited_image_path = generate(text=input_text, file_name=file_name, api_key=gemini_api_key, model=model)
 
-        if gemma_edited_image_path:
-            logger.debug(f"
+        if gemma_edited_image_path: # Check none or not
+            logger.debug(f"Image generated at path: {gemma_edited_image_path}")
             result_img = Image.open(gemma_edited_image_path)
             if result_img.mode == "RGBA":
                 result_img = result_img.convert("RGB")
             return [result_img]
         else:
-            logger.error("generate
-            return [] #
+            logger.error("generate function returned None.")
+            return [] # Return empty when error
 
     except Exception as e:
-        logger.exception("
-        return [] #
+        logger.exception("Error occurred in process_image_and_prompt")
+        return [] # Return empty when error
 
 
-# --- Gradio
+# --- Gradio Interface ---
 with gr.Blocks() as demo:
     gr.HTML(
         """
         <div style='display: flex; align-items: center; justify-content: center; gap: 20px'>
-
-
-
-
-
-
-
+            <div style="background-color: var(--block-background-fill); border-radius: 8px">
+                <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" style="width: 100px; height: 100px;">
+            </div>
+            <div>
+                <h1></h1>
+                <p>Edit images with Gemini</p>
+                <p>Get your API key <a href="https://aistudio.google.com/apikey">here</a>.</p>
+            </div>
         </div>
         """
     )
-    gr.Markdown("
+    gr.Markdown("Upload an image, then enter a prompt describing the edit you want.")
 
     with gr.Row():
        with gr.Column():
-            image_input = gr.Image(type="pil", label="
+            image_input = gr.Image(type="pil", label="Upload Image", image_mode="RGBA")
+            gemini_api_key = gr.Textbox(
+                lines=1,
+                placeholder="Enter your Gemini API Key",
+                label="Gemini API Key",
+                type="password"
+            )
             prompt_input = gr.Textbox(
                 lines=2,
-                placeholder="
-                label="
+                placeholder="Enter your prompt here...",
+                label="Prompt"
             )
-            submit_btn = gr.Button("
+            submit_btn = gr.Button("Generate")
         with gr.Column():
-            output_gallery = gr.Gallery(label="
+            output_gallery = gr.Gallery(label="Generated Images")
 
     submit_btn.click(
         fn=process_image_and_prompt,
-        inputs=[image_input, prompt_input],
+        inputs=[image_input, prompt_input, gemini_api_key],
         outputs=output_gallery,
     )
-
-# ---
-#
+
+# --- Test Code ---
+# Create a dummy image (replace with your actual image if needed)
 dummy_image = Image.new("RGBA", (100, 100), color="red")
-dummy_prompt = "
+dummy_prompt = "Make the image blue"
+dummy_api_key = os.environ.get("GEMINI_API_KEY") # Or put a placeholder key here for testing
 
-
-
+# Call the function directly
+logger.info("Calling process_image_and_prompt directly...")
+result = process_image_and_prompt(dummy_image, dummy_prompt, dummy_api_key)
 
 if result:
-    logger.info(f"
+    logger.info(f"Direct call successful. Result: {result}")
+    # result[0].show() # Uncomment to display image if running locally
 else:
-    logger.error("
+    logger.error("Direct call failed.")
 
-demo.launch(share=True)
+demo.launch(share=True) # gradio launch last
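The main behavioral change in this commit is the API-key resolution: a key typed into the new Gradio textbox takes precedence, and the GEMINI_API_KEY environment variable is only used as a fallback. Below is a minimal, self-contained sketch of that precedence logic so it can be exercised without any real credentials; the helper name resolve_api_key and the placeholder key values are illustrative and not part of app.py.

import os

def resolve_api_key(ui_key, env=os.environ):
    """Illustrative mirror of app.py's precedence: UI textbox first, then GEMINI_API_KEY."""
    if ui_key and ui_key.strip():
        return ui_key.strip()
    env_key = env.get("GEMINI_API_KEY")
    if not env_key:
        raise ValueError("API key is required.")
    return env_key

# An empty textbox falls back to the environment variable; a typed key wins.
fake_env = {"GEMINI_API_KEY": "env-key-placeholder"}
print(resolve_api_key("", env=fake_env))          # -> env-key-placeholder
print(resolve_api_key(" ui-key ", env=fake_env))  # -> ui-key

One caveat in the committed code: the debug line that reports "Using API Key" calls api_key.strip() unconditionally, so a None value from the textbox would raise AttributeError before the fallback is reached; the guard above (if ui_key and ui_key.strip()) avoids that.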