import json
import os
import time
import tempfile
from PIL import Image
import gradio as gr
import logging
import io

from google import genai
from google.genai import types

from dotenv import load_dotenv
load_dotenv()

logging.basicConfig(level=logging.DEBUG,
                    format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)
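

# Persist raw bytes (such as inline image data returned by the model) to a file on disk.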
def save_binary_file(file_name, data):
    logger.debug(f"Saving binary data to file: {file_name}")
    with open(file_name, "wb") as f:
        f.write(data)
    logger.debug(f"File saved: {file_name}")
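

# Generate a single image from a text prompt with the Gemini image generation model,
# streaming the response and saving any returned image bytes to a temporary PNG file.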
def generate_image_from_prompt(prompt, model="gemini-2.0-flash-exp-image-generation"):
    logger.debug(f"generate_image_from_prompt started - prompt: '{prompt}'")

    try:
        effective_api_key = os.environ.get("GEMINI_API_KEY")
        if effective_api_key:
            logger.debug("Loaded API key from environment variable.")
        else:
            logger.error("API key is not set in the environment variables.")
            raise ValueError("An API key is required.")

        client = genai.Client(api_key=effective_api_key)
        logger.debug("Gemini client initialized.")

        # Fall back to a default prompt when nothing meaningful was entered.
        if not prompt or not prompt.strip():
            prompt = "A creative and visually appealing image that captures imagination. Use vibrant colors and interesting composition."

        # If the prompt contains no ASCII letters (i.e. it is likely not written in English),
        # append an English instruction to steer the model toward a detailed image.
        if not any(c.isascii() and c.isalpha() for c in prompt):
            prompt += " Create a highly detailed, visually stunning image that captures the essence of the description."
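
        # Build the request contents: a single user part holding the prompt text.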
        parts = [
            types.Part.from_text(text=prompt)
        ]
        logger.debug(f"Content objects created: {len(parts)} item(s)")

        # Sampling settings; request both image and text parts in the response.
        generate_content_config = types.GenerateContentConfig(
            temperature=1,
            top_p=0.95,
            top_k=40,
            max_output_tokens=8192,
            response_modalities=["image", "text"],
        )
        logger.debug(f"Generation config: {generate_content_config}")

        # Create a temporary PNG path that survives past this block (delete=False).
        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
            temp_path = tmp.name
        logger.debug(f"Temporary file created: {temp_path}")
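
        # Stream the generation so text and image chunks can be handled as they arrive.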
        response_stream = client.models.generate_content_stream(
            model=model,
            contents=[
                types.Content(
                    role="user",
                    parts=parts,
                ),
            ],
            config=generate_content_config,
        )

        logger.debug("Processing response stream...")

        image_saved = False
        response_text = ""

        for chunk in response_stream:
            logger.debug(f"Received chunk: {chunk}")

            # Skip chunks that carry no usable candidate content.
            if not hasattr(chunk, 'candidates') or not chunk.candidates or len(chunk.candidates) == 0:
                logger.warning("Chunk has no candidates. Skipping.")
                continue

            if not hasattr(chunk.candidates[0], 'content') or chunk.candidates[0].content is None:
                logger.warning("chunk.candidates[0] has no content. Skipping.")
                continue

            if not hasattr(chunk.candidates[0].content, 'parts') or not chunk.candidates[0].content.parts:
                logger.warning("chunk.candidates[0].content has no parts. Skipping.")
                continue

            # Collect text parts and write any inline image data to the temp file.
            for part in chunk.candidates[0].content.parts:
                if hasattr(part, 'text') and part.text:
                    response_text += part.text
                    logger.info(f"Received text: {part.text}")
                elif hasattr(part, 'inline_data') and part.inline_data:
                    save_binary_file(temp_path, part.inline_data.data)
                    logger.info(f"File of MIME type {part.inline_data.mime_type} saved: {temp_path}")
                    image_saved = True
        if not image_saved:
            logger.warning("No image was generated.")
            return None, response_text or "No image was generated. Please try a different prompt."

        logger.debug("Image generation complete.")
        return temp_path, response_text

    except Exception as e:
        logger.exception("Error during image generation:")
        return None, f"Error: {str(e)}"
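

# Gradio callback: when any reference image is uploaded, delegate to
# process_images_and_prompt (defined elsewhere); otherwise generate from text alone.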
def process_image_generation(person_pil, product_pil, background_pil, prompt):
    logger.debug(f"process_image_generation started - prompt: '{prompt}'")
    try:
        # Image-composition path: at least one reference image was provided.
        if person_pil is not None or product_pil is not None or background_pil is not None:
            return process_images_and_prompt(person_pil, product_pil, background_pil, prompt)

        # Text-only generation path.
        result_path, response_text = generate_image_from_prompt(prompt)

        if result_path:
            logger.debug(f"Image generation complete. Path: {result_path}")
            try:
                result_img = Image.open(result_path)
                if result_img.mode == "RGBA":
                    result_img = result_img.convert("RGB")

                return [result_img], response_text or "The image was generated successfully."
            except Exception as e:
                logger.exception(f"Error loading result image: {str(e)}")
                return [], f"Error processing result image: {str(e)}"
        else:
            logger.error("generate_image_from_prompt returned None.")
            return [], response_text or "Image generation failed. Please try a different prompt."

    except Exception as e:
        logger.exception("Error in process_image_generation:")
        return [], f"Error: {str(e)}"
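

# Gradio UI: three optional image inputs and a prompt textbox on the left,
# a gallery and response textbox on the right.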
with gr.Blocks() as demo:
    gr.HTML(
        """
        <div style='display: flex; align-items: center; justify-content: center; gap: 20px'>
            <div style="background-color: var(--block-background-fill); border-radius: 8px">
                <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" style="width: 100px; height: 100px;">
            </div>
            <div>
                <h1>Image Generation with Gemini</h1>
                <p>Compose person, product, and background images, or generate an image from text alone.</p>
            </div>
        </div>
        """
    )
    gr.Markdown("Upload a person, product, or background image, or generate an image from text only.")

    with gr.Row():
        with gr.Column():
            person_input = gr.Image(type="pil", label="Person image (optional)", image_mode="RGB")
            product_input = gr.Image(type="pil", label="Product image (optional)", image_mode="RGB")
            background_input = gr.Image(type="pil", label="Background image (optional)", image_mode="RGB")

            prompt_input = gr.Textbox(
                lines=3,
                placeholder="Describe the image to generate, e.g. 'A young woman smiling in a sunlit flower field', 'A businessman using a premium smartphone in a modern living room'",
                label="Image description (required)"
            )
            submit_btn = gr.Button("Generate Image")

        with gr.Column():
            output_gallery = gr.Gallery(label="Generated Images")
            output_text = gr.Textbox(label="AI Response Text", visible=True)

    submit_btn.click(
        fn=process_image_generation,
        inputs=[person_input, product_input, background_input, prompt_input],
        outputs=[output_gallery, output_text],
    )

    gr.HTML("""
    <div style="margin-top: 20px; padding: 10px; background-color: #f8f9fa; border-radius: 8px;">
        <h3>How to use:</h3>
        <ul>
            <li><strong>Text-to-image:</strong> Enter a description only and press the Generate Image button.</li>
            <li><strong>Image composition:</strong> Optionally upload person, product, and background images and describe how they should be combined.</li>
            <li><strong>Prompt tip:</strong> The more specific and vivid the description, the better the generated image.</li>
            <li><strong>Example prompts:</strong>
                <ul>
                    <li>A creator working on a laptop in a cozy cafe</li>
                    <li>A model posing on a beach wearing premium sunglasses</li>
                    <li>A chef making a smoothie with the latest blender in a modern kitchen</li>
                </ul>
            </li>
            <li><strong>Language tip:</strong> Mixing Korean and English in the prompt can yield more accurate results.</li>
        </ul>
    </div>
    """)
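
# share=True exposes the app through a temporary public Gradio link in addition to localhost.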
if __name__ == "__main__":
    demo.launch(share=True)