Update app.py
Browse files
app.py
CHANGED
@@ -4,8 +4,8 @@ from PIL import Image
|
|
4 |
import gradio as gr
|
5 |
import logging
|
6 |
import re
|
|
|
7 |
from io import BytesIO
|
8 |
-
import time
|
9 |
|
10 |
from google import genai
|
11 |
from google.genai import types
|
@@ -22,162 +22,111 @@ def save_binary_file(file_name, data):
|
|
22 |
with open(file_name, "wb") as f:
|
23 |
f.write(data)
|
24 |
|
25 |
-
def translate_prompt_to_english(prompt):
|
26 |
-
"""
|
27 |
-
์
๋ ฅ๋ ํ๋กฌํํธ์ ํ๊ธ์ด ํฌํจ๋์ด ์์ผ๋ฉด Geminiโ2.0โflash ๋ชจ๋ธ์ ์ฌ์ฉํ์ฌ ์์ด๋ก ๋ฒ์ญํฉ๋๋ค.
|
28 |
-
ํ๊ธ์ด ์์ผ๋ฉด ์๋ณธ ํ๋กฌํํธ๋ฅผ ๊ทธ๋๋ก ๋ฐํํฉ๋๋ค.
|
29 |
-
์ค์: #1, #2, #3 ํ๊ทธ๋ ๋ฒ์ญ ์ ํ์ ๋ฐ๋์ ๋ณด์กด๋์ด์ผ ํฉ๋๋ค.
|
30 |
-
"""
|
31 |
-
if not re.search("[๊ฐ-ํฃ]", prompt):
|
32 |
-
return prompt
|
33 |
-
|
34 |
-
# #1, #2, #3 ํ๊ทธ๋ฅผ ์์ ํ ํฐ์ผ๋ก ๋์ฒดํ์ฌ ๋ณด์กด
|
35 |
-
prompt = prompt.replace("#1", "IMAGE_TAG_ONE")
|
36 |
-
prompt = prompt.replace("#2", "IMAGE_TAG_TWO")
|
37 |
-
prompt = prompt.replace("#3", "IMAGE_TAG_THREE")
|
38 |
-
|
39 |
-
try:
|
40 |
-
api_key = os.environ.get("GEMINI_API_KEY")
|
41 |
-
if not api_key:
|
42 |
-
logger.error("Gemini API ํค๊ฐ ์ค์ ๋์ง ์์์ต๋๋ค.")
|
43 |
-
# ์์ ํ ํฐ์ ์๋ ํ๊ทธ๋ก ๋ณต์
|
44 |
-
prompt = prompt.replace("IMAGE_TAG_ONE", "#1")
|
45 |
-
prompt = prompt.replace("IMAGE_TAG_TWO", "#2")
|
46 |
-
prompt = prompt.replace("IMAGE_TAG_THREE", "#3")
|
47 |
-
return prompt
|
48 |
-
|
49 |
-
client = genai.Client(api_key=api_key)
|
50 |
-
translation_prompt = f"""
|
51 |
-
Translate the following Korean text to English:
|
52 |
-
|
53 |
-
{prompt}
|
54 |
-
|
55 |
-
IMPORTANT: The tokens IMAGE_TAG_ONE, IMAGE_TAG_TWO, and IMAGE_TAG_THREE are special tags
|
56 |
-
and must be preserved exactly as is in your translation. Do not translate these tokens.
|
57 |
-
"""
|
58 |
-
|
59 |
-
logger.info(f"Translation prompt: {translation_prompt}")
|
60 |
-
response = client.models.generate_content(
|
61 |
-
model="gemini-2.0-flash",
|
62 |
-
contents=[translation_prompt],
|
63 |
-
config=types.GenerateContentConfig(
|
64 |
-
response_modalities=['Text'],
|
65 |
-
temperature=0.2,
|
66 |
-
top_p=0.95,
|
67 |
-
top_k=40,
|
68 |
-
max_output_tokens=512
|
69 |
-
)
|
70 |
-
)
|
71 |
-
|
72 |
-
translated_text = ""
|
73 |
-
for part in response.candidates[0].content.parts:
|
74 |
-
if hasattr(part, 'text') and part.text:
|
75 |
-
translated_text += part.text
|
76 |
-
|
77 |
-
if translated_text.strip():
|
78 |
-
# ๋ฒ์ญ๋ ํ
์คํธ์์ ์์ ํ ํฐ์ ์๋ ํ๊ทธ๋ก ๋ณต์
|
79 |
-
translated_text = translated_text.replace("IMAGE_TAG_ONE", "#1")
|
80 |
-
translated_text = translated_text.replace("IMAGE_TAG_TWO", "#2")
|
81 |
-
translated_text = translated_text.replace("IMAGE_TAG_THREE", "#3")
|
82 |
-
logger.info(f"Translated text: {translated_text.strip()}")
|
83 |
-
return translated_text.strip()
|
84 |
-
else:
|
85 |
-
logger.warning("๋ฒ์ญ ๊ฒฐ๊ณผ๊ฐ ์์ต๋๋ค. ์๋ณธ ํ๋กฌํํธ ์ฌ์ฉ")
|
86 |
-
# ์์ ํ ํฐ์ ์๋ ํ๊ทธ๋ก ๋ณต์
|
87 |
-
prompt = prompt.replace("IMAGE_TAG_ONE", "#1")
|
88 |
-
prompt = prompt.replace("IMAGE_TAG_TWO", "#2")
|
89 |
-
prompt = prompt.replace("IMAGE_TAG_THREE", "#3")
|
90 |
-
return prompt
|
91 |
-
except Exception as e:
|
92 |
-
logger.exception("๋ฒ์ญ ์ค ์ค๋ฅ ๋ฐ์:")
|
93 |
-
# ์์ ํ ํฐ์ ์๋ ํ๊ทธ๋ก ๋ณต์
|
94 |
-
prompt = prompt.replace("IMAGE_TAG_ONE", "#1")
|
95 |
-
prompt = prompt.replace("IMAGE_TAG_TWO", "#2")
|
96 |
-
prompt = prompt.replace("IMAGE_TAG_THREE", "#3")
|
97 |
-
return prompt
|
98 |
-
|
99 |
def preprocess_prompt(prompt, image1, image2, image3):
|
100 |
"""
|
101 |
ํ๋กฌํํธ๋ฅผ ์ฒ๋ฆฌํ๊ณ ๊ธฐ๋ฅ ๋ช
๋ น์ ํด์
|
102 |
"""
|
|
|
|
|
103 |
has_img1 = image1 is not None
|
104 |
has_img2 = image2 is not None
|
105 |
has_img3 = image3 is not None
|
106 |
-
|
|
|
107 |
if "#1" in prompt and not has_img1:
|
108 |
prompt = prompt.replace("#1", "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
109 |
else:
|
110 |
prompt = prompt.replace("#1", "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
111 |
-
|
112 |
if "#2" in prompt and not has_img2:
|
113 |
prompt = prompt.replace("#2", "๋ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
114 |
else:
|
115 |
prompt = prompt.replace("#2", "๋ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
116 |
-
|
117 |
if "#3" in prompt and not has_img3:
|
118 |
prompt = prompt.replace("#3", "์ธ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
119 |
else:
|
120 |
prompt = prompt.replace("#3", "์ธ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
121 |
-
|
|
|
122 |
if "1. ์ด๋ฏธ์ง ๋ณ๊ฒฝ" in prompt:
|
|
|
123 |
desc_match = re.search(r'#1์ "(.*?)"์ผ๋ก ๋ฐ๊ฟ๋ผ', prompt)
|
124 |
if desc_match:
|
125 |
description = desc_match.group(1)
|
126 |
prompt = f"์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ {description}์ผ๋ก ๋ณ๊ฒฝํด์ฃผ์ธ์. ์๋ณธ ์ด๋ฏธ์ง์ ์ฃผ์ ๋ด์ฉ์ ์ ์งํ๋ ์๋ก์ด ๏ฟฝ๏ฟฝํ์ผ๊ณผ ๋ถ์๊ธฐ๋ก ์ฌํด์ํด์ฃผ์ธ์."
|
127 |
else:
|
128 |
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ๋ณํํด์ฃผ์ธ์. ๋ ์์ํ๊ณ ์์ ์ ์ธ ๋ฒ์ ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
129 |
-
|
130 |
elif "2. ๊ธ์์ง์ฐ๊ธฐ" in prompt:
|
|
|
131 |
text_match = re.search(r'#1์์ "(.*?)"๋ฅผ ์ง์๋ผ', prompt)
|
132 |
if text_match:
|
133 |
text_to_remove = text_match.group(1)
|
134 |
prompt = f"์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์์ '{text_to_remove}' ํ
์คํธ๋ฅผ ์ฐพ์ ์์ฐ์ค๋ฝ๊ฒ ์ ๊ฑฐํด์ฃผ์ธ์. ํ
์คํธ๊ฐ ์๋ ๋ถ๋ถ์ ๋ฐฐ๊ฒฝ๊ณผ ์กฐํ๋กญ๊ฒ ์ฑ์์ฃผ์ธ์."
|
135 |
else:
|
136 |
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์์ ๋ชจ๋ ํ
์คํธ๋ฅผ ์ฐพ์ ์์ฐ์ค๋ฝ๊ฒ ์ ๊ฑฐํด์ฃผ์ธ์. ๊น๋ํ ์ด๋ฏธ์ง๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
137 |
-
|
|
|
|
|
|
|
138 |
elif "4. ์ท๋ฐ๊พธ๊ธฐ" in prompt:
|
139 |
-
|
140 |
-
|
|
|
|
|
|
|
|
|
141 |
elif "5. ๋ฐฐ๊ฒฝ๋ฐ๊พธ๊ธฐ" in prompt:
|
142 |
-
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ์ผ๋ก
|
143 |
-
|
144 |
elif "6. ์ด๋ฏธ์ง ํฉ์ฑ(์ํํฌํจ)" in prompt:
|
145 |
-
|
146 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
147 |
prompt += " ์ด๋ฏธ์ง๋ฅผ ์์ฑํด์ฃผ์ธ์."
|
|
|
148 |
return prompt
|
149 |
|
150 |
-
def generate_with_images(prompt, images
|
151 |
"""
|
152 |
-
|
153 |
-
variation_index๋ก ๋ค์ํ ๋ณํ๋ฅผ ์ค๋๋ค.
|
154 |
-
์์ฑ๋ ์ด๋ฏธ์ง๋ ์ผ๊ด๋ ํฌ๊ธฐ๋ก ์กฐ์ ๋ฉ๋๋ค.
|
155 |
"""
|
156 |
try:
|
|
|
157 |
api_key = os.environ.get("GEMINI_API_KEY")
|
158 |
if not api_key:
|
159 |
return None, "API ํค๊ฐ ์ค์ ๋์ง ์์์ต๋๋ค. ํ๊ฒฝ๋ณ์๋ฅผ ํ์ธํด์ฃผ์ธ์."
|
160 |
-
|
|
|
161 |
client = genai.Client(api_key=api_key)
|
162 |
-
logger.info(f"Gemini API ์์ฒญ ์์ - ํ๋กฌํํธ: {prompt}, ๋ณํ ์ธ๋ฑ์ค: {variation_index}")
|
163 |
-
|
164 |
-
# ๋ณํ ์ธ๋ฑ์ค์ ๋ฐ๋ผ ํ๋กฌํํธ์ ์ฝ๊ฐ์ ๋ณํ ์ถ๊ฐ
|
165 |
-
variation_suffixes = [
|
166 |
-
" ์ฒซ ๋ฒ์งธ ๋ณํ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์.",
|
167 |
-
" ๋ ๋ฒ์งธ ๋ณํ์ผ๋ก ๋ ์์ํ๊ฒ ๋ง๋ค์ด์ฃผ์ธ์.",
|
168 |
-
" ์ธ ๋ฒ์งธ ๋ณํ์ผ๋ก ๋ ์ฐฝ์์ ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์.",
|
169 |
-
" ๋ค ๋ฒ์งธ ๋ณํ์ผ๋ก ์๊ฐ์ ๋ ๊ฐ์กฐํด์ ๋ง๋ค์ด์ฃผ์ธ์."
|
170 |
-
]
|
171 |
|
172 |
-
|
173 |
-
|
174 |
-
|
175 |
-
contents = [
|
|
|
|
|
|
|
|
|
|
|
176 |
for idx, img in enumerate(images, 1):
|
177 |
if img is not None:
|
178 |
contents.append(img)
|
179 |
logger.info(f"์ด๋ฏธ์ง #{idx} ์ถ๊ฐ๋จ")
|
180 |
-
|
|
|
181 |
response = client.models.generate_content(
|
182 |
model="gemini-2.0-flash-exp-image-generation",
|
183 |
contents=contents,
|
@@ -189,11 +138,15 @@ def generate_with_images(prompt, images, variation_index=0):
|
|
189 |
max_output_tokens=8192
|
190 |
)
|
191 |
)
|
192 |
-
|
|
|
193 |
with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
|
194 |
temp_path = tmp.name
|
|
|
195 |
result_text = ""
|
196 |
image_found = False
|
|
|
|
|
197 |
for part in response.candidates[0].content.parts:
|
198 |
if hasattr(part, 'text') and part.text:
|
199 |
result_text += part.text
|
@@ -202,210 +155,183 @@ def generate_with_images(prompt, images, variation_index=0):
|
|
202 |
save_binary_file(temp_path, part.inline_data.data)
|
203 |
image_found = True
|
204 |
logger.info("์๋ต์์ ์ด๋ฏธ์ง ์ถ์ถ ์ฑ๊ณต")
|
|
|
205 |
if not image_found:
|
206 |
return None, f"API์์ ์ด๋ฏธ์ง๋ฅผ ์์ฑํ์ง ๋ชปํ์ต๋๋ค. ์๋ต ํ
์คํธ: {result_text}"
|
|
|
|
|
207 |
result_img = Image.open(temp_path)
|
208 |
if result_img.mode == "RGBA":
|
209 |
result_img = result_img.convert("RGB")
|
210 |
|
211 |
-
# ์ด๋ฏธ์ง ํฌ๊ธฐ๋ฅผ 512x512๋ก ์กฐ์ ํ์ฌ ์ผ๊ด๋ ์ถ๋ ฅ ํฌ๊ธฐ ์ ์ง
|
212 |
-
target_size = (512, 512)
|
213 |
-
result_img = result_img.resize(target_size, Image.Resampling.LANCZOS)
|
214 |
-
|
215 |
return result_img, f"์ด๋ฏธ์ง๊ฐ ์ฑ๊ณต์ ์ผ๋ก ์์ฑ๋์์ต๋๋ค. {result_text}"
|
|
|
216 |
except Exception as e:
|
217 |
logger.exception("์ด๋ฏธ์ง ์์ฑ ์ค ์ค๋ฅ ๋ฐ์:")
|
218 |
return None, f"์ค๋ฅ ๋ฐ์: {str(e)}"
|
219 |
|
220 |
-
def process_images_with_prompt(image1, image2, image3, prompt
|
221 |
"""
|
222 |
-
3๊ฐ์ ์ด๋ฏธ์ง์ ํ๋กฌํํธ๋ฅผ
|
223 |
-
API๋ฅผ ํธ์ถํ์ฌ ๊ฒฐ๊ณผ ์ด๋ฏธ์ง๋ฅผ ๋ฐํํฉ๋๋ค.
|
224 |
"""
|
225 |
try:
|
|
|
226 |
images = [image1, image2, image3]
|
227 |
valid_images = [img for img in images if img is not None]
|
|
|
228 |
if not valid_images:
|
229 |
-
return None, "์ ์ด๋ ํ๋์ ์ด๋ฏธ์ง๋ฅผ ์
๋ก๋ํด์ฃผ์ธ์."
|
230 |
-
|
231 |
-
|
232 |
-
|
233 |
-
|
234 |
-
final_prompt = translate_prompt_to_english(processed_prompt)
|
235 |
-
else:
|
236 |
-
final_prompt = processed_prompt
|
237 |
-
else:
|
238 |
if len(valid_images) == 1:
|
239 |
-
|
240 |
-
logger.info("
|
241 |
elif len(valid_images) == 2:
|
242 |
-
|
243 |
-
logger.info("
|
244 |
else:
|
245 |
-
|
246 |
-
logger.info("
|
247 |
-
|
248 |
-
|
249 |
-
|
|
|
|
|
|
|
|
|
250 |
except Exception as e:
|
251 |
logger.exception("์ด๋ฏธ์ง ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์:")
|
252 |
-
return None, f"์ค๋ฅ ๋ฐ์: {str(e)}"
|
253 |
|
254 |
-
|
255 |
-
|
256 |
-
|
257 |
-
|
258 |
-
|
259 |
-
|
260 |
-
|
|
|
|
|
|
|
|
|
261 |
|
262 |
-
|
263 |
-
|
264 |
-
progress(0, desc="์ด๋ฏธ์ง ์์ฑ ์ค๋น ์ค...")
|
265 |
-
|
266 |
-
for i in range(num_images):
|
267 |
-
progress((i / num_images), desc=f"{i+1}/{num_images} ์ด๋ฏธ์ง ์์ฑ ์ค...")
|
268 |
-
result_img, status, final_prompt = process_images_with_prompt(image1, image2, image3, prompt, i)
|
269 |
-
|
270 |
-
if result_img is not None:
|
271 |
-
results.append(result_img)
|
272 |
-
statuses.append(f"์ด๋ฏธ์ง #{i+1}: {status}")
|
273 |
-
prompts.append(f"์ด๋ฏธ์ง #{i+1}: {final_prompt}")
|
274 |
-
else:
|
275 |
-
# ์๋ฌ๊ฐ ๋ฐ์ํ ๊ฒฝ์ฐ์๋ ๊ฒฐ๊ณผ ๋ชฉ๋ก์ None์ ์ถ๊ฐ
|
276 |
-
results.append(None)
|
277 |
-
statuses.append(f"์ด๋ฏธ์ง #{i+1} ์์ฑ ์คํจ: {status}")
|
278 |
-
prompts.append(f"์ด๋ฏธ์ง #{i+1}: {final_prompt}")
|
279 |
-
|
280 |
-
# API ํธ์ถ ์ฌ์ด์ ์ฝ๊ฐ์ ๊ฐ๊ฒฉ์ ๋์ด ์๋ ์ ํ ๋ฐฉ์ง
|
281 |
-
time.sleep(1)
|
282 |
-
|
283 |
-
progress(1.0, desc="์ด๋ฏธ์ง ์์ฑ ์๋ฃ!")
|
284 |
-
|
285 |
-
# ๊ฒฐ๊ณผ๊ฐ ์๋ ๊ฒฝ์ฐ ๋น ์ฌ๋กฏ ์ฑ์ฐ๊ธฐ
|
286 |
-
while len(results) < 4:
|
287 |
-
results.append(None)
|
288 |
-
|
289 |
-
# ์ํ ๋ฉ์์ง์ ํ๋กฌํํธ ์ ๋ณด ๊ฒฐํฉ
|
290 |
-
combined_status = "\n".join(statuses)
|
291 |
-
combined_prompts = "\n".join(prompts)
|
292 |
-
|
293 |
-
return results[0], results[1], results[2], results[3], combined_status, combined_prompts
|
294 |
|
295 |
-
# Gradio ์ธํฐํ์ด์ค
|
296 |
-
with gr.Blocks(
|
297 |
-
.
|
298 |
-
|
299 |
-
|
300 |
-
|
301 |
-
|
302 |
-
|
303 |
-
|
304 |
-
|
305 |
-
|
306 |
-
|
307 |
-
<h1 style="margin-bottom: 0.5rem;">4์ฅ ์ด๋ฏธ์ง ์์ฑ๊ธฐ</h1>
|
308 |
-
<p style="margin-bottom: 0.2rem;">์ด๋ฏธ์ง๋ฅผ ์
๋ก๋ํ๊ณ "์ด๋ฏธ์ง ์์ฑ" ๋ฒํผ์ ํด๋ฆญํ๋ฉด</p>
|
309 |
-
<p>์ฐจ๋ก๋ก 4์ฅ์ ์ด๋ฏธ์ง๊ฐ ์์ฑ๋ฉ๋๋ค.</p>
|
310 |
-
</div>
|
311 |
-
"""
|
312 |
-
)
|
313 |
-
|
314 |
-
# ์
๋ ฅ ์น์
|
315 |
-
gr.HTML("<h3 style='text-align: center; margin-top: 1rem; margin-bottom: 0.5rem;'>์
๋ ฅ ์ด๋ฏธ์ง</h3>")
|
316 |
-
|
317 |
-
# ์
๋ ฅ ์ด๋ฏธ์ง UI๋ฅผ ์ ์ ํ ๊ฐ๊ฒฉ์ผ๋ก ์ธ๋ก ๋ฐฐ์น
|
318 |
with gr.Column():
|
|
|
319 |
with gr.Row():
|
320 |
-
image1_input = gr.Image(type="pil", label="#1",
|
321 |
-
image2_input = gr.Image(type="pil", label="#2",
|
322 |
-
|
323 |
-
|
324 |
-
|
325 |
-
|
326 |
-
# ํ๋กฌํํธ ์
๋ ฅ
|
327 |
-
prompt_input = gr.Textbox(
|
328 |
-
lines=3,
|
329 |
-
placeholder="ํ๋กฌํํธ๋ฅผ ์
๋ ฅํ๊ฑฐ๋ ๋น์๋๋ฉด ์๋ ํฉ์ฑ๋ฉ๋๋ค.",
|
330 |
-
label="ํ๋กฌํํธ (์ ํ ์ฌํญ)"
|
331 |
-
)
|
332 |
-
|
333 |
-
# ๋ฒํผ ์คํ์ผ ๊ฐ์
|
334 |
-
with gr.Column(variant="panel"):
|
335 |
-
gr.HTML("<h4 style='margin-bottom: 0.5rem; text-align: center; width: 100%;'>์์
์ ํ</h4>")
|
336 |
with gr.Row():
|
337 |
-
|
338 |
-
|
339 |
-
|
340 |
-
|
341 |
-
|
342 |
-
|
343 |
-
|
344 |
-
|
345 |
-
|
346 |
-
|
347 |
-
|
348 |
-
|
349 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
350 |
|
351 |
-
# ์ถ๋ ฅ ์ด๋ฏธ์ง UI๋ฅผ ์ธ๋ก๋ก ๋ฐฐ์น
|
352 |
with gr.Column():
|
353 |
-
|
354 |
-
|
355 |
-
|
356 |
-
|
357 |
-
|
358 |
-
|
359 |
-
|
360 |
-
# ์ํ ๋ฐ ํ๋กฌํํธ ์ ๋ณด
|
361 |
-
output_text = gr.Textbox(label="์ํ ๋ฉ์์ง")
|
362 |
-
prompt_display = gr.Textbox(label="์ฌ์ฉ๋ ํ๋กฌํํธ (์์ด)", visible=True)
|
363 |
|
364 |
-
#
|
365 |
-
|
366 |
-
fn=
|
367 |
-
inputs=[],
|
368 |
-
outputs=prompt_input
|
369 |
-
)
|
370 |
-
text_remove_btn.click(
|
371 |
-
fn=lambda: "(#1 ์ด๋ฏธ์ง)์ ์๋ ์ค๊ตญ์ด๋ฅผ ๋ชจ๋ ์ ๊ฑฐํ๋ผ.",
|
372 |
-
inputs=[],
|
373 |
-
outputs=prompt_input
|
374 |
-
)
|
375 |
-
clothes_change_btn.click(
|
376 |
-
fn=lambda: "(#1์ ์ฌ์ฑ๋ชจ๋ธ)์ด ์ ์ฒด ๋น์ก๊ณผ ํฌ์ฆ๋ ์ ์นํ ์ฒด (#2์ ์ ๊ธ๋ผ์ค)์ (#3์ ์ฒญ๋ฐ์ง)๋ฅผ ์ง์ ๋ชจ๋ธ์ด ์ฐฉ์ฉํ๊ฒ ์ฒ๋ผ ์์ฐ์ค๋ฝ๊ฒ ์ด๋ฏธ์ง๋ฅผ ์์ฑํ๋ผ.",
|
377 |
-
inputs=[],
|
378 |
-
outputs=prompt_input
|
379 |
-
)
|
380 |
-
background_change_btn.click(
|
381 |
-
fn=lambda: "(#1์ ์ฌ์ฑ๋ชจ๋ธ)์ด (#2 ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ)์ ์ฃผ์ ํผ์ฌ์ฒด๋ ๊ทธ๋๋ก ์ ์งํ์ฌ ๋ ์ด๋ฏธ์ง์ ๋ถ์๊ธฐ๊ฐ ์์ฐ์ค๋ฝ๊ฒ ์ด์ฐ๋ฌ์ง๋๋ก ์์ฑํ๋ผ.",
|
382 |
-
inputs=[],
|
383 |
-
outputs=prompt_input
|
384 |
-
)
|
385 |
-
composite_product_btn.click(
|
386 |
-
fn=lambda: "#1 ์ด๋ฏธ์ง์์ [์ ๊ฑฐํ ์์ญ ๋๋ ๋์์ ์์ธํ ์์ฑํด์ฃผ์ธ์]์ ์ ๊ฑฐํ ํ, ๊ทธ ์๋ฆฌ๋ฅผ ์ฃผ๋ณ ๋ฐฐ๊ฒฝ๊ณผ ์์ฐ์ค๋ฝ๊ฒ ์ด์ฐ๋ฌ์ง๋๋ก ์ฑ์์ฃผ์ธ์. ๋จ, ์ด๋ฏธ์ง์ ์ฃผ์ ์์์ ์ ์ฒด ๋ถ์๊ธฐ๋ ๋์ผํ๊ฒ ์ ์งํด ์ฃผ์ธ์.",
|
387 |
-
inputs=[],
|
388 |
-
outputs=prompt_input
|
389 |
)
|
390 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
391 |
submit_btn.click(
|
392 |
-
fn=
|
393 |
inputs=[image1_input, image2_input, image3_input, prompt_input],
|
394 |
-
outputs=[
|
395 |
)
|
396 |
-
|
397 |
gr.Markdown(
|
398 |
"""
|
399 |
### ์ฌ์ฉ ๋ฐฉ๋ฒ:
|
400 |
|
401 |
-
1. **์๋ ํฉ์ฑ**:
|
402 |
-
2.
|
403 |
-
3.
|
404 |
-
4.
|
|
|
405 |
|
406 |
-
> **ํ**: ํ๋กฌํํธ๋ฅผ ์ง์ ์์ ํ
|
407 |
"""
|
408 |
)
|
409 |
|
|
|
410 |
if __name__ == "__main__":
|
411 |
demo.launch(share=True)
|
|
|
4 |
import gradio as gr
|
5 |
import logging
|
6 |
import re
|
7 |
+
import io
|
8 |
from io import BytesIO
|
|
|
9 |
|
10 |
from google import genai
|
11 |
from google.genai import types
|
|
|
22 |
with open(file_name, "wb") as f:
|
23 |
f.write(data)
|
24 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
def preprocess_prompt(prompt, image1, image2, image3):
|
26 |
"""
|
27 |
ํ๋กฌํํธ๋ฅผ ์ฒ๋ฆฌํ๊ณ ๊ธฐ๋ฅ ๋ช
๋ น์ ํด์
|
28 |
"""
|
29 |
+
# ๊ธฐ์กด preprocess_prompt ํจ์ ์ฝ๋ ์ ์ง
|
30 |
+
# ์ด๋ฏธ์ง ์๋ ์ฐธ์กฐ ํ์ธ ๋ฐ ์ฒ๋ฆฌ
|
31 |
has_img1 = image1 is not None
|
32 |
has_img2 = image2 is not None
|
33 |
has_img3 = image3 is not None
|
34 |
+
|
35 |
+
# #1, #2, #3 ์ฐธ์กฐ๋ฅผ ์ค๋ช
์ผ๋ก ๋ณํ (์ด๋ฏธ์ง๊ฐ ์๋ ๊ฒฝ์ฐ ๋ฌด์)
|
36 |
if "#1" in prompt and not has_img1:
|
37 |
prompt = prompt.replace("#1", "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
38 |
else:
|
39 |
prompt = prompt.replace("#1", "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
40 |
+
|
41 |
if "#2" in prompt and not has_img2:
|
42 |
prompt = prompt.replace("#2", "๋ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
43 |
else:
|
44 |
prompt = prompt.replace("#2", "๋ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
45 |
+
|
46 |
if "#3" in prompt and not has_img3:
|
47 |
prompt = prompt.replace("#3", "์ธ ๋ฒ์งธ ์ด๋ฏธ์ง(์์)")
|
48 |
else:
|
49 |
prompt = prompt.replace("#3", "์ธ ๋ฒ์งธ ์ด๋ฏธ์ง")
|
50 |
+
|
51 |
+
# ๊ธฐ๋ฅ ๋ช
๋ น ํด์
|
52 |
if "1. ์ด๋ฏธ์ง ๋ณ๊ฒฝ" in prompt:
|
53 |
+
# ์ค๋ช
์ถ์ถ์ ์๋ํ์ง๋ง ์คํจํด๋ ๊ธฐ๋ณธ ํ๋กฌํํธ ์ ๊ณต
|
54 |
desc_match = re.search(r'#1์ "(.*?)"์ผ๋ก ๋ฐ๊ฟ๋ผ', prompt)
|
55 |
if desc_match:
|
56 |
description = desc_match.group(1)
|
57 |
prompt = f"์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ {description}์ผ๋ก ๋ณ๊ฒฝํด์ฃผ์ธ์. ์๋ณธ ์ด๋ฏธ์ง์ ์ฃผ์ ๋ด์ฉ์ ์ ์งํ๋ ์๋ก์ด ๏ฟฝ๏ฟฝํ์ผ๊ณผ ๋ถ์๊ธฐ๋ก ์ฌํด์ํด์ฃผ์ธ์."
|
58 |
else:
|
59 |
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ๋ณํํด์ฃผ์ธ์. ๋ ์์ํ๊ณ ์์ ์ ์ธ ๋ฒ์ ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
60 |
+
|
61 |
elif "2. ๊ธ์์ง์ฐ๊ธฐ" in prompt:
|
62 |
+
# ์ง์ธ ํ
์คํธ ์ถ์ถ์ ์๋ํ์ง๋ง ์คํจํด๋ ๊ธฐ๋ณธ ํ๋กฌํํธ ์ ๊ณต
|
63 |
text_match = re.search(r'#1์์ "(.*?)"๋ฅผ ์ง์๋ผ', prompt)
|
64 |
if text_match:
|
65 |
text_to_remove = text_match.group(1)
|
66 |
prompt = f"์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์์ '{text_to_remove}' ํ
์คํธ๋ฅผ ์ฐพ์ ์์ฐ์ค๋ฝ๊ฒ ์ ๊ฑฐํด์ฃผ์ธ์. ํ
์คํธ๊ฐ ์๋ ๋ถ๋ถ์ ๋ฐฐ๊ฒฝ๊ณผ ์กฐํ๋กญ๊ฒ ์ฑ์์ฃผ์ธ์."
|
67 |
else:
|
68 |
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์์ ๋ชจ๋ ํ
์คํธ๋ฅผ ์ฐพ์ ์์ฐ์ค๋ฝ๊ฒ ์ ๊ฑฐํด์ฃผ์ธ์. ๊น๋ํ ์ด๋ฏธ์ง๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
69 |
+
|
70 |
+
elif "3. ์ผ๊ตด๋ฐ๊พธ๊ธฐ" in prompt:
|
71 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ธ๋ฌผ ์ผ๊ตด์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ผ๊ตด๋ก ์์ฐ์ค๋ฝ๊ฒ ๊ต์ฒดํด์ฃผ์ธ์. ์ผ๊ตด์ ํ์ ๊ณผ ํน์ง์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ๋ฐ๋ฅด๋, ๋๋จธ์ง ๋ถ๋ถ์ ์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์ ์งํด์ฃผ์ธ์."
|
72 |
+
|
73 |
elif "4. ์ท๋ฐ๊พธ๊ธฐ" in prompt:
|
74 |
+
# ์ฌ๋ฌ ์ด๋ฏธ์ง ์ฐธ์กฐ ์ฒ๋ฆฌ
|
75 |
+
if "#3" in prompt or "๋๋ #3" in prompt:
|
76 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ธ๋ฌผ ์์์ ๋ ๋ฒ์งธ ๋๋ ์ธ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์์์ผ๋ก ์์ฐ์ค๋ฝ๊ฒ ๊ต์ฒดํด์ฃผ์ธ์. ์์์ ์คํ์ผ๊ณผ ์์์ ์ฐธ์กฐ ์ด๋ฏธ์ง๋ฅผ ๋ฐ๋ฅด๋, ์ ์ฒด ๋น์จ๊ณผ ํฌ์ฆ๋ ์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์ ์งํด์ฃผ์ธ์."
|
77 |
+
else:
|
78 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ธ๋ฌผ ์์์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์์์ผ๋ก ์์ฐ์ค๋ฝ๊ฒ ๊ต์ฒดํด์ฃผ์ธ์. ์์์ ์คํ์ผ๊ณผ ์์์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ๋ฐ๋ฅด๋, ์ ์ฒด ๋น์จ๊ณผ ํฌ์ฆ๋ ์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์ ์งํด์ฃผ์ธ์."
|
79 |
+
|
80 |
elif "5. ๋ฐฐ๊ฒฝ๋ฐ๊พธ๊ธฐ" in prompt:
|
81 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ์ผ๋ก ์์ฐ์ค๋ฝ๊ฒ ๊ต์ฒดํด์ฃผ์ธ์. ์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ฃผ์ ํผ์ฌ์ฒด๋ ์ ์งํ๊ณ , ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ฐฐ๊ฒฝ๊ณผ ์กฐํ๋กญ๊ฒ ํฉ์ฑํด์ฃผ์ธ์."
|
82 |
+
|
83 |
elif "6. ์ด๋ฏธ์ง ํฉ์ฑ(์ํํฌํจ)" in prompt:
|
84 |
+
# ์ฌ๋ฌ ์ด๋ฏธ์ง ์ฐธ์กฐ ์ฒ๋ฆฌ
|
85 |
+
if "#3" in prompt or "๋๋ #3" in prompt:
|
86 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ ๋ฒ์งธ, ์ธ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์์ฐ์ค๋ฝ๊ฒ ํฉ์ฑํด์ฃผ์ธ์. ๋ชจ๋ ์ด๋ฏธ์ง์ ์ฃผ์ ์์๋ฅผ ํฌํจํ๊ณ , ํนํ ์ํ์ด ์ ๋ณด์ด๋๋ก ์กฐํ๋กญ๊ฒ ํตํฉํด์ฃผ์ธ์."
|
87 |
+
else:
|
88 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ์์ฐ์ค๋ฝ๊ฒ ํฉ์ฑํด์ฃผ์ธ์. ๋ ์ด๋ฏธ์ง์ ์ฃผ์ ์์๋ฅผ ํฌํจํ๊ณ , ํนํ ์ํ์ด ์ ๋ณด์ด๋๋ก ์กฐํ๋กญ๊ฒ ํตํฉํด์ฃผ์ธ์."
|
89 |
+
|
90 |
+
elif "7. ์ด๋ฏธ์ง ํฉ์ฑ(์คํ์ผ์ ์ฉ)" in prompt:
|
91 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ๋ด์ฉ์ ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์คํ์ผ๋ก ๋ณํํด์ฃผ์ธ์. ์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์ฃผ์ ํผ์ฌ์ฒด์ ๊ตฌ๋๋ ์ ์งํ๋, ๋ ๋ฒ์งธ ์ด๋ฏธ์ง์ ์์ ์ ์คํ์ผ, ์์, ์ง๊ฐ์ ์ ์ฉํด์ฃผ์ธ์."
|
92 |
+
|
93 |
+
# ๊ฐ๋จํ ์์ ๋ณ๊ฒฝ ์์ฒญ ์ฒ๋ฆฌ
|
94 |
+
elif "์ ๋ถ์์์ผ๋ก ๋ฐ๊ฟ๋ผ" in prompt or "๋ฅผ ๋ถ์์์ผ๋ก ๋ฐ๊ฟ๋ผ" in prompt:
|
95 |
+
prompt = "์ฒซ ๋ฒ์งธ ์ด๋ฏธ์ง๋ฅผ ๋ถ์์ ํค์ผ๋ก ๋ณ๊ฒฝํด์ฃผ์ธ์. ์ ์ฒด์ ์ธ ์์์ ๋ถ์ ๊ณ์ด๋ก ์กฐ์ ํ๊ณ ์์ฐ์ค๋ฌ์ด ๋๋์ ์ ์งํด์ฃผ์ธ์."
|
96 |
+
|
97 |
+
# ๋ช
ํํ ์ด๋ฏธ์ง ์์ฑ ์์ฒญ ์ถ๊ฐ
|
98 |
prompt += " ์ด๋ฏธ์ง๋ฅผ ์์ฑํด์ฃผ์ธ์."
|
99 |
+
|
100 |
return prompt
|
101 |
|
102 |
+
def generate_with_images(prompt, images):
|
103 |
"""
|
104 |
+
๊ณต์ ๋ฌธ์์ ๊ธฐ๋ฐํ ์ฌ๋ฐ๋ฅธ API ํธ์ถ ๋ฐฉ์ ๊ตฌํ
|
|
|
|
|
105 |
"""
|
106 |
try:
|
107 |
+
# API ํค ํ์ธ
|
108 |
api_key = os.environ.get("GEMINI_API_KEY")
|
109 |
if not api_key:
|
110 |
return None, "API ํค๊ฐ ์ค์ ๋์ง ์์์ต๋๋ค. ํ๊ฒฝ๋ณ์๋ฅผ ํ์ธํด์ฃผ์ธ์."
|
111 |
+
|
112 |
+
# Gemini ํด๋ผ์ด์ธํธ ์ด๊ธฐํ
|
113 |
client = genai.Client(api_key=api_key)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
114 |
|
115 |
+
logger.info(f"Gemini API ์์ฒญ ์์ - ํ๋กฌํํธ: {prompt}")
|
116 |
+
|
117 |
+
# ์ปจํ
์ธ ์ค๋น
|
118 |
+
contents = []
|
119 |
+
|
120 |
+
# ํ
์คํธ ํ๋กฌํํธ ์ถ๊ฐ
|
121 |
+
contents.append(prompt)
|
122 |
+
|
123 |
+
# ์ด๋ฏธ์ง ์ถ๊ฐ
|
124 |
for idx, img in enumerate(images, 1):
|
125 |
if img is not None:
|
126 |
contents.append(img)
|
127 |
logger.info(f"์ด๋ฏธ์ง #{idx} ์ถ๊ฐ๋จ")
|
128 |
+
|
129 |
+
# ์์ฑ ์ค์ - ๊ณต์ ๋ฌธ์์ ๋ฐ๋ผ responseModalities ์ค์
|
130 |
response = client.models.generate_content(
|
131 |
model="gemini-2.0-flash-exp-image-generation",
|
132 |
contents=contents,
|
|
|
138 |
max_output_tokens=8192
|
139 |
)
|
140 |
)
|
141 |
+
|
142 |
+
# ์์ ํ์ผ ์์ฑ
|
143 |
with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
|
144 |
temp_path = tmp.name
|
145 |
+
|
146 |
result_text = ""
|
147 |
image_found = False
|
148 |
+
|
149 |
+
# ์๋ต ์ฒ๋ฆฌ
|
150 |
for part in response.candidates[0].content.parts:
|
151 |
if hasattr(part, 'text') and part.text:
|
152 |
result_text += part.text
|
|
|
155 |
save_binary_file(temp_path, part.inline_data.data)
|
156 |
image_found = True
|
157 |
logger.info("์๋ต์์ ์ด๋ฏธ์ง ์ถ์ถ ์ฑ๊ณต")
|
158 |
+
|
159 |
if not image_found:
|
160 |
return None, f"API์์ ์ด๋ฏธ์ง๋ฅผ ์์ฑํ์ง ๋ชปํ์ต๋๋ค. ์๋ต ํ
์คํธ: {result_text}"
|
161 |
+
|
162 |
+
# ๊ฒฐ๊ณผ ์ด๋ฏธ์ง ๋ฐํ
|
163 |
result_img = Image.open(temp_path)
|
164 |
if result_img.mode == "RGBA":
|
165 |
result_img = result_img.convert("RGB")
|
166 |
|
|
|
|
|
|
|
|
|
167 |
return result_img, f"์ด๋ฏธ์ง๊ฐ ์ฑ๊ณต์ ์ผ๋ก ์์ฑ๋์์ต๋๋ค. {result_text}"
|
168 |
+
|
169 |
except Exception as e:
|
170 |
logger.exception("์ด๋ฏธ์ง ์์ฑ ์ค ์ค๋ฅ ๋ฐ์:")
|
171 |
return None, f"์ค๋ฅ ๋ฐ์: {str(e)}"
|
172 |
|
173 |
+
def process_images_with_prompt(image1, image2, image3, prompt):
|
174 |
"""
|
175 |
+
3๊ฐ์ ์ด๋ฏธ์ง์ ํ๋กฌํํธ๋ฅผ ์ฒ๋ฆฌํ๋ ํจ์
|
|
|
176 |
"""
|
177 |
try:
|
178 |
+
# ์ด๋ฏธ์ง ๊ฐ์ ํ์ธ
|
179 |
images = [image1, image2, image3]
|
180 |
valid_images = [img for img in images if img is not None]
|
181 |
+
|
182 |
if not valid_images:
|
183 |
+
return None, "์ ์ด๋ ํ๋์ ์ด๋ฏธ์ง๋ฅผ ์
๋ก๋ํด์ฃผ์ธ์."
|
184 |
+
|
185 |
+
# ํ๋กฌํํธ ์ฒ๋ฆฌ
|
186 |
+
if not prompt or not prompt.strip():
|
187 |
+
# ํ๋กฌํํธ๊ฐ ์์ผ๋ฉด ์
๋ก๋๋ ์ด๋ฏธ์ง ์์ ๋ฐ๋ผ ์๋ ํฉ์ฑ ํ๋กฌํํธ ์์ฑ
|
|
|
|
|
|
|
|
|
188 |
if len(valid_images) == 1:
|
189 |
+
prompt = "์ด ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ๋ณํํด์ฃผ์ธ์. ๋ ์์ํ๊ณ ์์ ์ ์ธ ๋ฒ์ ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
190 |
+
logger.info("๋จ์ผ ์ด๋ฏธ์ง ํ๋กฌํํธ ์๋ ์์ฑ")
|
191 |
elif len(valid_images) == 2:
|
192 |
+
prompt = "์ด ๋ ์ด๋ฏธ์ง๋ฅผ ์์ฐ์ค๋ฝ๊ฒ ํฉ์ฑํด์ฃผ์ธ์. ๋ ์ด๋ฏธ์ง์ ์์๋ฅผ ์กฐํ๋กญ๊ฒ ํตํฉํ์ฌ ํ๋์ ์ด๋ฏธ์ง๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
193 |
+
logger.info("๋ ์ด๋ฏธ์ง ํฉ์ฑ ํ๋กฌํํธ ์๋ ์์ฑ")
|
194 |
else:
|
195 |
+
prompt = "์ด ์ธ ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ํฉ์ฑํด์ฃผ์ธ์. ๋ชจ๋ ์ด๋ฏธ์ง์ ์ฃผ์ ์์๋ฅผ ํฌํจํ๋ ์์ฐ์ค๋ฝ๊ณ ์ผ๊ด๋ ํ๋์ ์ฅ๋ฉด์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
196 |
+
logger.info("์ธ ์ด๋ฏธ์ง ํฉ์ฑ ํ๋กฌํํธ ์๋ ์์ฑ")
|
197 |
+
else:
|
198 |
+
# ํ๋กฌํํธ ์ ์ฒ๋ฆฌ ๋ฐ ๊ธฐ๋ฅ ๋ช
๋ น ํด์
|
199 |
+
prompt = preprocess_prompt(prompt, image1, image2, image3)
|
200 |
+
|
201 |
+
# ์๋ก์ด API ํธ์ถ ๋ฐฉ์ ์ฌ์ฉ
|
202 |
+
return generate_with_images(prompt, valid_images)
|
203 |
+
|
204 |
except Exception as e:
|
205 |
logger.exception("์ด๋ฏธ์ง ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์:")
|
206 |
+
return None, f"์ค๋ฅ ๋ฐ์: {str(e)}"
|
207 |
|
208 |
+
# ๊ธฐ๋ฅ ์ ํ ์ฝ๋ฐฑ (๊ธฐ์กด ์ฝ๋ ์ ์ง)
|
209 |
+
def update_prompt_from_function(function_choice, custom_text=""):
|
210 |
+
function_templates = {
|
211 |
+
"1. ์ด๋ฏธ์ง ๋ณ๊ฒฝ": f'#1์ "{custom_text if custom_text else "์ํ๋ ์ค๋ช
"}"์ผ๋ก ๋ฐ๊ฟ๋ผ',
|
212 |
+
"2. ๊ธ์์ง์ฐ๊ธฐ": f'#1์์ "{custom_text if custom_text else "์ง์ธ ํ
์คํธ"}"๋ฅผ ์ง์๋ผ',
|
213 |
+
"3. ์ผ๊ตด๋ฐ๊พธ๊ธฐ": "#1์ ์ธ๋ฌผ์ #2์ ์ผ๊ตด๋ก ๋ฐ๊ฟ๋ผ",
|
214 |
+
"4. ์ท๋ฐ๊พธ๊ธฐ": "#1์ ์ธ๋ฌผ์ #2 ๋๋ #3์ ์ท์ผ๋ก ๋ณ๊ฒฝํ๋ผ",
|
215 |
+
"5. ๋ฐฐ๊ฒฝ๋ฐ๊พธ๊ธฐ": "#1์ ์ด๋ฏธ์ง์ #2์ ๋ฐฐ๊ฒฝ์ผ๋ก ์์ฐ์ค๋ฝ๊ฒ ๋ฐ๊ฟ๋ผ",
|
216 |
+
"6. ์ด๋ฏธ์ง ํฉ์ฑ(์ํํฌํจ)": "#1์ #2 ๋๋ #3์ ๋ฅผ ํฉ์ฑํ๋ผ",
|
217 |
+
"7. ์ด๋ฏธ์ง ํฉ์ฑ(์คํ์ผ์ ์ฉ)": "#1์ #2๋ฅผ ์คํ์ผ๋ก ๋ณํํ๋ผ"
|
218 |
+
}
|
219 |
|
220 |
+
return function_templates.get(function_choice, "")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
221 |
|
222 |
+
# Gradio ์ธํฐํ์ด์ค (๊ธฐ์กด ์ฝ๋ ์ ์ง)
|
223 |
+
with gr.Blocks() as demo:
|
224 |
+
gr.HTML(
|
225 |
+
"""
|
226 |
+
<div style="text-align: center; margin-bottom: 1rem;">
|
227 |
+
<h1>๊ฐ๋จํ ์ด๋ฏธ์ง ์์ฑ๊ธฐ</h1>
|
228 |
+
<p>์ด๋ฏธ์ง๋ฅผ ์
๋ก๋ํ๏ฟฝ๏ฟฝ ๋ฐ๋ก ์คํํ๋ฉด ์๋์ผ๋ก ํฉ์ฑํฉ๋๋ค. ๋๋ ์๋ ๊ธฐ๋ฅ์ ์ ํํ ์ ์์ต๋๋ค.</p>
|
229 |
+
</div>
|
230 |
+
"""
|
231 |
+
)
|
232 |
+
|
233 |
+
with gr.Row():
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
234 |
with gr.Column():
|
235 |
+
# 3๊ฐ์ ์ด๋ฏธ์ง ์
๋ ฅ
|
236 |
with gr.Row():
|
237 |
+
image1_input = gr.Image(type="pil", label="#1", image_mode="RGB")
|
238 |
+
image2_input = gr.Image(type="pil", label="#2", image_mode="RGB")
|
239 |
+
image3_input = gr.Image(type="pil", label="#3", image_mode="RGB")
|
240 |
+
|
241 |
+
# ๊ธฐ๋ฅ ์ ํ ๋๋กญ๋ค์ด๊ณผ ์ปค์คํ
ํ
์คํธ ์
๋ ฅ
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
242 |
with gr.Row():
|
243 |
+
function_dropdown = gr.Dropdown(
|
244 |
+
choices=[
|
245 |
+
"1. ์ด๋ฏธ์ง ๋ณ๊ฒฝ",
|
246 |
+
"2. ๊ธ์์ง์ฐ๊ธฐ",
|
247 |
+
"3. ์ผ๊ตด๋ฐ๊พธ๊ธฐ",
|
248 |
+
"4. ์ท๋ฐ๊พธ๊ธฐ",
|
249 |
+
"5. ๋ฐฐ๊ฒฝ๋ฐ๊พธ๊ธฐ",
|
250 |
+
"6. ์ด๋ฏธ์ง ํฉ์ฑ(์ํํฌํจ)",
|
251 |
+
"7. ์ด๋ฏธ์ง ํฉ์ฑ(์คํ์ผ์ ์ฉ)"
|
252 |
+
],
|
253 |
+
label="๊ธฐ๋ฅ ์ ํ",
|
254 |
+
value=None
|
255 |
+
)
|
256 |
+
custom_text_input = gr.Textbox(
|
257 |
+
label="์ปค์คํ
ํ
์คํธ (1, 2๋ฒ ๊ธฐ๋ฅ์ฉ)",
|
258 |
+
placeholder="์: ๋ถ์์, ์์ฑํ ์คํ์ผ, ์ค๊ตญ์ด..."
|
259 |
+
)
|
260 |
+
|
261 |
+
apply_function_btn = gr.Button("๊ธฐ๋ฅ ์ ์ฉ")
|
262 |
+
|
263 |
+
# ํ๋กฌํํธ ์
๋ ฅ (์ ํ ์ฌํญ)
|
264 |
+
prompt_input = gr.Textbox(
|
265 |
+
lines=3,
|
266 |
+
placeholder="ํ๋กฌํํธ๋ฅผ ์
๋ ฅํ๊ฑฐ๋ ๋น์๋๋ฉด ์๋ ํฉ์ฑ๋ฉ๋๋ค.",
|
267 |
+
label="ํ๋กฌํํธ (์ ํ ์ฌํญ)"
|
268 |
+
)
|
269 |
+
|
270 |
+
# ์์ฑ ๋ฒํผ
|
271 |
+
submit_btn = gr.Button("์ด๋ฏธ์ง ์์ฑ", variant="primary")
|
272 |
|
|
|
273 |
with gr.Column():
|
274 |
+
# ๊ฒฐ๊ณผ ์ถ๋ ฅ
|
275 |
+
output_image = gr.Image(label="์์ฑ๋ ์ด๋ฏธ์ง")
|
276 |
+
output_text = gr.Textbox(label="์ํ ๋ฉ์์ง")
|
277 |
+
|
278 |
+
# ์ฌ์ฉ๋ ํ๋กฌํํธ ํ์
|
279 |
+
prompt_display = gr.Textbox(label="์ฌ์ฉ๋ ํ๋กฌํํธ", visible=True)
|
|
|
|
|
|
|
|
|
280 |
|
281 |
+
# ๊ธฐ๋ฅ ์ ์ฉ ๋ฒํผ ์ด๋ฒคํธ
|
282 |
+
apply_function_btn.click(
|
283 |
+
fn=update_prompt_from_function,
|
284 |
+
inputs=[function_dropdown, custom_text_input],
|
285 |
+
outputs=[prompt_input]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
286 |
)
|
287 |
|
288 |
+
# ์ด๋ฏธ์ง ์์ฑ ๋ฒํผ ํด๋ฆญ ์ด๋ฒคํธ
|
289 |
+
def process_and_show_prompt(image1, image2, image3, prompt):
|
290 |
+
# ์ด๋ฏธ์ง ๊ฐ์ ํ์ธ
|
291 |
+
images = [image1, image2, image3]
|
292 |
+
valid_images = [img for img in images if img is not None]
|
293 |
+
|
294 |
+
try:
|
295 |
+
# ์๋ ํ๋กฌํํธ ์์ฑ ๋๋ ํ๋กฌํํธ ์ ์ฒ๋ฆฌ
|
296 |
+
auto_prompt = prompt
|
297 |
+
if not prompt or not prompt.strip():
|
298 |
+
if len(valid_images) == 1:
|
299 |
+
auto_prompt = "์ด ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ๋ณํํด์ฃผ์ธ์. ๋ ์์ํ๊ณ ์์ ์ ์ธ ๋ฒ์ ์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
300 |
+
elif len(valid_images) == 2:
|
301 |
+
auto_prompt = "์ด ๋ ์ด๋ฏธ์ง๋ฅผ ์์ฐ์ค๋ฝ๊ฒ ํฉ์ฑํด์ฃผ์ธ์. ๋ ์ด๋ฏธ์ง์ ์์๋ฅผ ์กฐํ๋กญ๊ฒ ํตํฉํ์ฌ ํ๋์ ์ด๋ฏธ์ง๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
302 |
+
else:
|
303 |
+
auto_prompt = "์ด ์ธ ์ด๋ฏธ์ง๋ฅผ ์ฐฝ์์ ์ผ๋ก ํฉ์ฑํด์ฃผ์ธ์. ๋ชจ๋ ์ด๋ฏธ์ง์ ์ฃผ์ ์์๋ฅผ ํฌํจํ๋ ์์ฐ์ค๋ฝ๊ณ ์ผ๊ด๋ ํ๋์ ์ฅ๋ฉด์ผ๋ก ๋ง๋ค์ด์ฃผ์ธ์."
|
304 |
+
else:
|
305 |
+
auto_prompt = preprocess_prompt(prompt, image1, image2, image3)
|
306 |
+
|
307 |
+
# ์ด๋ฏธ์ง ์์ฑ ํจ์ ํธ์ถ
|
308 |
+
result_img, status = process_images_with_prompt(image1, image2, image3, prompt)
|
309 |
+
|
310 |
+
return result_img, status, auto_prompt
|
311 |
+
except Exception as e:
|
312 |
+
logger.exception("์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์:")
|
313 |
+
return None, f"์ค๋ฅ ๋ฐ์: {str(e)}", prompt
|
314 |
+
|
315 |
submit_btn.click(
|
316 |
+
fn=process_and_show_prompt,
|
317 |
inputs=[image1_input, image2_input, image3_input, prompt_input],
|
318 |
+
outputs=[output_image, output_text, prompt_display],
|
319 |
)
|
320 |
+
|
321 |
gr.Markdown(
|
322 |
"""
|
323 |
### ์ฌ์ฉ ๋ฐฉ๋ฒ:
|
324 |
|
325 |
+
1. **์๋ ํฉ์ฑ**: ์ด๋ฏธ์ง๋ง ์
๋ก๋ํ๊ณ ํ๋กฌํํธ๋ฅผ ๋น์๋๋ฉด ์๋์ผ๋ก ํฉ์ฑ๋ฉ๋๋ค
|
326 |
+
2. **๊ธฐ๋ฅ ์ฌ์ฉ**: ๋๋กญ๋ค์ด์์ ์ํ๋ ๊ธฐ๋ฅ์ ์ ํํ๊ณ '๊ธฐ๋ฅ ์ ์ฉ' ๋ฒํผ์ ํด๋ฆญํ์ธ์
|
327 |
+
3. **์ปค์คํ
ํ
์คํธ**: ์ด๋ฏธ์ง ๋ณ๊ฒฝ์ด๋ ๊ธ์์ง์ฐ๊ธฐ ๊ธฐ๋ฅ์ ์ ํํ ๋ ์ถ๊ฐ ์ค๋ช
์ ์
๋ ฅํ ์ ์์ต๋๋ค
|
328 |
+
4. **์ด๋ฏธ์ง ์ฐธ์กฐ**: #1, #2, #3์ผ๋ก ๊ฐ ์ด๋ฏธ์ง๋ฅผ ์ฐธ์กฐํ ์ ์์ต๋๋ค
|
329 |
+
5. **์ผ๋ถ ์ด๋ฏธ์ง๋ง**: ํ์ํ ์ด๋ฏธ์ง๋ง ์
๋ก๋ํด๋ ๊ธฐ๋ฅ ์คํ์ด ๊ฐ๋ฅํฉ๋๋ค
|
330 |
|
331 |
+
> **ํ**: ๊ธฐ๋ฅ์ ์ ํํ ํ์๋ ํ๋กฌํํธ๋ฅผ ์ง์ ์์ ํ ์ ์์ต๋๋ค
|
332 |
"""
|
333 |
)
|
334 |
|
335 |
+
# ์ ํ๋ฆฌ์ผ์ด์
์คํ
|
336 |
if __name__ == "__main__":
|
337 |
demo.launch(share=True)
|