import json
import os
import time
import tempfile
from PIL import Image
import gradio as gr
import logging
from io import BytesIO

from google import genai
from google.genai import types

# .env 파일에 저장된 환경변수 로드 (python-dotenv 설치 필요: pip install python-dotenv)
from dotenv import load_dotenv
load_dotenv()

# 로깅 설정 (로그 레벨: DEBUG)
logging.basicConfig(level=logging.DEBUG,
                    format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)


def save_binary_file(file_name, data):
    logger.debug(f"파일에 이진 데이터 저장 중: {file_name}")
    with open(file_name, "wb") as f:
        f.write(data)
    logger.debug(f"파일 저장 완료: {file_name}")


def merge_images(person_img_path, product_img_path, background_img_path, prompt, model="gemini-2.0-flash-exp-image-generation"):
    logger.debug(f"merge_images 함수 시작 - 프롬프트: '{prompt}'")
    
    try:
        # API 키는 환경변수에서 불러옴
        effective_api_key = os.environ.get("GEMINI_API_KEY")
        if effective_api_key:
            logger.debug("환경변수에서 API 키 불러옴")
        else:
            logger.error("API 키가 환경변수에 설정되지 않았습니다.")
            raise ValueError("API 키가 필요합니다.")

        client = genai.Client(api_key=effective_api_key)
        logger.debug("Gemini 클라이언트 초기화 완료.")

        # PIL 이미지 객체로 변환
        person_img = Image.open(person_img_path)
        product_img = Image.open(product_img_path)
        
        # 컨텐츠 리스트 생성
        contents = []
        
        # 사람 이미지 추가
        contents.append(
            types.Part.from_data(data=person_img, mime_type="image/jpeg")
        )
        
        # 상품 이미지 추가
        contents.append(
            types.Part.from_data(data=product_img, mime_type="image/jpeg")
        )
        
        # 배경 이미지가 있으면 추가
        if background_img_path:
            background_img = Image.open(background_img_path)
            contents.append(
                types.Part.from_data(data=background_img, mime_type="image/jpeg")
            )
            logger.debug("배경 이미지 추가됨")
        
        # 마지막에 프롬프트 추가
        contents.append(
            types.Part.from_text(text=prompt)
        )
        
        logger.debug(f"컨텐츠 객체 생성 완료: {len(contents)} 아이템")

        # 생성 설정
        generate_content_config = types.GenerateContentConfig(
            temperature=1,
            top_p=0.95,
            top_k=40,
            max_output_tokens=8192,
            response_modalities=["image", "text"],
        )
        logger.debug(f"생성 설정: {generate_content_config}")

        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
            temp_path = tmp.name
            logger.debug(f"임시 파일 생성됨: {temp_path}")

            # 스트리밍 방식으로 데이터 수신 (원래 코드 방식으로 복원)
            response_stream = client.models.generate_content_stream(
                model=model,
                contents=[
                    types.Content(
                        role="user",
                        parts=contents,
                    ),
                ],
                config=generate_content_config,
            )
            
            logger.debug("응답 스트림 처리 시작...")
            
            # 응답에서 이미지와 텍스트 추출
            image_saved = False
            response_text = ""
            
            for chunk in response_stream:
                logger.debug(f"chunk 수신: {chunk}")
                
                # 응답 검증
                if not hasattr(chunk, 'candidates') or not chunk.candidates:
                    logger.warning("chunk에 candidates가 없습니다. 건너뜁니다.")
                    continue
                    
                if not hasattr(chunk.candidates[0], 'content') or not chunk.candidates[0].content:
                    logger.warning("chunk.candidates[0]에 content가 없습니다. 건너뜁니다.")
                    continue
                    
                if not hasattr(chunk.candidates[0].content, 'parts') or not chunk.candidates[0].content.parts:
                    logger.warning("chunk.candidates[0].content에 parts가 없습니다. 건너뜁니다.")
                    continue
                
                for part in chunk.candidates[0].content.parts:
                    if hasattr(part, 'text') and part.text:
                        response_text += part.text
                        logger.info(f"수신된 텍스트: {part.text}")
                    elif hasattr(part, 'inline_data') and part.inline_data:
                        save_binary_file(temp_path, part.inline_data.data)
                        logger.info(f"MIME 타입 {part.inline_data.mime_type}의 파일이 저장됨: {temp_path}")
                        image_saved = True

            if not image_saved:
                logger.warning("이미지가 생성되지 않았습니다.")
                return None, response_text or "이미지가 생성되지 않았습니다. 다른 프롬프트나 이미지로 시도해보세요."

        logger.debug("이미지 생성 완료.")
        return temp_path, response_text

    except Exception as e:
        logger.exception("이미지 생성 중 오류 발생:")
        return None, f"오류 발생: {str(e)}"  # 오류 발생 시 None과 오류 메시지 반환


def process_images_and_prompt(person_pil, product_pil, background_pil, prompt):
    logger.debug(f"process_images_and_prompt 함수 시작 - 프롬프트: '{prompt}'")
    try:
        # 필수 이미지 확인
        if person_pil is None:
            return [], "사람 이미지를 업로드해주세요."
        if product_pil is None:
            return [], "상품 이미지를 업로드해주세요."
            
        # 기본 프롬프트 설정 (비어있는 경우)
        if not prompt or not prompt.strip():
            if background_pil:
                prompt = "이 배경에 이 사람이 이 상품을 사용하는 모습을 자연스럽게 보여주세요. 상품을 잘 보이게 해주세요. Create a natural composite image showing this person using this product in this background setting. Make sure the product is clearly visible."
            else:
                prompt = "이 사람이 이 상품을 사용하는 모습을 자연스럽게 보여주세요. 상품을 잘 보이게 해주세요. Create a natural composite image showing this person using this product. Make sure the product is clearly visible."
        
        # 프롬프트에 영어가 없으면 영어 프롬프트 추가 (더 나은 결과를 위해)
        if not any(ord(c) < 128 for c in prompt):
            if background_pil:
                prompt += " Create a realistic composite image of this person with this product in this background."
            else:
                prompt += " Create a realistic composite image of this person with this product."
        
        # 이미지 저장
        with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as tmp_person:
            person_path = tmp_person.name
            # RGB로 변환하여 저장
            person_img = person_pil
            if person_img.mode != 'RGB':
                person_img = person_img.convert('RGB')
            person_img.save(person_path, 'JPEG')
            logger.debug(f"사람 이미지 저장 완료: {person_path}")
            
        with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as tmp_product:
            product_path = tmp_product.name
            # RGB로 변환하여 저장
            product_img = product_pil
            if product_img.mode != 'RGB':
                product_img = product_img.convert('RGB')
            product_img.save(product_path, 'JPEG')
            logger.debug(f"상품 이미지 저장 완료: {product_path}")
        
        # 배경 이미지 저장 (있는 경우)
        background_path = None
        if background_pil is not None:
            with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as tmp_bg:
                background_path = tmp_bg.name
                # RGB로 변환하여 저장
                background_img = background_pil
                if background_img.mode != 'RGB':
                    background_img = background_img.convert('RGB')
                background_img.save(background_path, 'JPEG')
                logger.debug(f"배경 이미지 저장 완료: {background_path}")

        # 이미지 합성 실행
        result_path, response_text = merge_images(
            person_img_path=person_path,
            product_img_path=product_path,
            background_img_path=background_path,
            prompt=prompt
        )

        # 이미지 반환 및 임시 파일 정리
        if result_path:
            logger.debug(f"이미지 생성 완료. 경로: {result_path}")
            try:
                result_img = Image.open(result_path)
                if result_img.mode == "RGBA":
                    result_img = result_img.convert("RGB")
                
                # 임시 파일 정리
                try:
                    os.unlink(person_path)
                    os.unlink(product_path)
                    if background_path:
                        os.unlink(background_path)
                except Exception as e:
                    logger.warning(f"임시 파일 삭제 중 오류: {str(e)}")
                
                return [result_img], response_text or "이미지가 성공적으로 생성되었습니다."
            except Exception as e:
                logger.exception(f"결과 이미지 로드 중 오류: {str(e)}")
                return [], f"결과 이미지 처리 중 오류: {str(e)}"
        else:
            logger.error("merge_images 함수에서 None 반환됨.")
            return [], response_text or "이미지 생성에 실패했습니다. 다른 이미지나 프롬프트로 시도해보세요."

    except Exception as e:
        logger.exception("process_images_and_prompt 함수에서 오류 발생:")
        return [], f"오류 발생: {str(e)}"  # 오류 시 빈 리스트와 오류 메시지 반환


# --- Gradio 인터페이스 구성 ---
with gr.Blocks() as demo:
    gr.HTML(
        """
        <div style='display: flex; align-items: center; justify-content: center; gap: 20px'>
            <div style="background-color: var(--block-background-fill); border-radius: 8px">
                <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" style="width: 100px; height: 100px;">
            </div>
            <div>
                <h1>Gemini를 이용한 이미지 합성</h1>
                <p>사람, 상품, 배경 이미지를 합성하는 애플리케이션입니다.</p>
            </div>
        </div>
        """
    )
    gr.Markdown("사람 이미지, 상품 이미지, 배경 이미지를 업로드하고, 어떻게 합성할지 설명해주세요.")

    with gr.Row():
        with gr.Column():
            person_input = gr.Image(type="pil", label="사람 이미지 (필수)", image_mode="RGB")
            product_input = gr.Image(type="pil", label="상품 이미지 (필수)", image_mode="RGB")
            background_input = gr.Image(type="pil", label="배경 이미지 (선택 사항)", image_mode="RGB")
            prompt_input = gr.Textbox(
                lines=2,
                placeholder="합성 방법을 설명해주세요. (예: '이 배경에서 이 사람이 상품을 사용하는 모습' 또는 '이 사람이 이 상품을 들고 이 배경에 서 있는 모습')",
                label="합성 방법 설명"
            )
            submit_btn = gr.Button("이미지 합성 실행")
        with gr.Column():
            output_gallery = gr.Gallery(label="합성 결과")
            output_text = gr.Textbox(label="AI 응답 텍스트", visible=True)

    submit_btn.click(
        fn=process_images_and_prompt,
        inputs=[person_input, product_input, background_input, prompt_input],
        outputs=[output_gallery, output_text],
    )

    gr.HTML("""
    <div style="margin-top: 20px; padding: 10px; background-color: #f8f9fa; border-radius: 8px;">
        <h3>사용 팁:</h3>
        <ul>
            <li><strong>배경 활용:</strong> "이 배경에서 이 사람이 이 상품을 사용하는 자연스러운 모습을 만들어주세요."</li>
            <li><strong>특정 위치 지정:</strong> "이 사람이 이 상품을 손에 들고 이 배경 앞에 서 있는 모습을 보여주세요."</li>
            <li><strong>상품 강조:</strong> "이 사람이 이 배경에서 이 상품을 사용하는 모습을 보여주되, 상품이 잘 보이도록 해주세요."</li>
            <li><strong>장면 설정:</strong> "이 사람이 이 상품으로 요리하는 모습을 이 주방 배경에서 보여주세요."</li>
            <li><strong>영어 프롬프트:</strong> 더 나은 결과를 위해 영어와 한국어를 함께 사용해 보세요.</li>
            <li><strong>배경 선택사항:</strong> 배경 이미지는 선택사항입니다. 배경 없이 사람과 상품만 합성할 수도 있습니다.</li>
        </ul>
    </div>
    """)

# --- 실행 ---
if __name__ == "__main__":
    demo.launch(share=True)