Spaces:
Running
Running
Upload app.py
Browse files
app.py
CHANGED
@@ -14,10 +14,6 @@ def pil_to_bytes(img, format="PNG"):
|
|
14 |
img.save(img_byte_arr, format=format)
|
15 |
return img_byte_arr.getvalue()
|
16 |
|
17 |
-
# Function to save API key in browser local storage
|
18 |
-
def save_api_key(api_key):
|
19 |
-
return api_key
|
20 |
-
|
21 |
# Function to load image as base64
|
22 |
async def load_image_base64(img):
|
23 |
if isinstance(img, str):
|
@@ -28,7 +24,7 @@ async def load_image_base64(img):
|
|
28 |
return pil_to_bytes(img)
|
29 |
|
30 |
# Main function to generate edited image using Gemini
|
31 |
-
async def generate_image_gemini(prompt, image, api_key):
|
32 |
SAFETY_SETTINGS = {
|
33 |
types.HarmCategory.HARM_CATEGORY_HARASSMENT: types.HarmBlockThreshold.BLOCK_NONE,
|
34 |
types.HarmCategory.HARM_CATEGORY_HATE_SPEECH: types.HarmBlockThreshold.BLOCK_NONE,
|
@@ -73,6 +69,7 @@ async def generate_image_gemini(prompt, image, api_key):
|
|
73 |
model="gemini-2.0-flash-exp",
|
74 |
contents=contents,
|
75 |
config=types.GenerateContentConfig(
|
|
|
76 |
safety_settings=[
|
77 |
types.SafetySetting(
|
78 |
category=category, threshold=threshold
|
@@ -100,7 +97,7 @@ async def generate_image_gemini(prompt, image, api_key):
|
|
100 |
return None
|
101 |
|
102 |
# Function to process the image edit
|
103 |
-
def process_image_edit(image, prompt, api_key, image_history):
|
104 |
if not image or not prompt or not api_key:
|
105 |
return None, image_history, "Please provide an image, prompt, and API key"
|
106 |
|
@@ -112,7 +109,7 @@ def process_image_edit(image, prompt, api_key, image_history):
|
|
112 |
|
113 |
# Run the async function to edit the image
|
114 |
try:
|
115 |
-
edited_image = asyncio.run(generate_image_gemini(prompt, image, api_key))
|
116 |
if edited_image:
|
117 |
return edited_image, image_history, "Image edited successfully"
|
118 |
else:
|
@@ -132,46 +129,35 @@ def undo_edit(image_history):
|
|
132 |
|
133 |
# Create Gradio UI
|
134 |
def create_ui():
|
135 |
-
with gr.Blocks(title="Gemini Image Editor"
|
136 |
-
function() {
|
137 |
-
// Wait for the DOM to be fully loaded
|
138 |
-
window.addEventListener('DOMContentLoaded', (event) => {
|
139 |
-
setTimeout(function() {
|
140 |
-
// Try to load saved API key from localStorage
|
141 |
-
const savedKey = localStorage.getItem('gemini_api_key');
|
142 |
-
const apiKeyInput = document.querySelector('input[placeholder="Enter your Gemini API key"]');
|
143 |
-
if (savedKey && apiKeyInput) {
|
144 |
-
apiKeyInput.value = savedKey;
|
145 |
-
// Dispatch an input event to make sure Gradio recognizes the change
|
146 |
-
const event = new Event('input', { bubbles: true });
|
147 |
-
apiKeyInput.dispatchEvent(event);
|
148 |
-
}
|
149 |
-
|
150 |
-
// Add event listener to save API key when checkbox is checked
|
151 |
-
const saveKeyCheckbox = document.querySelector('input[type="checkbox"]');
|
152 |
-
if (apiKeyInput && saveKeyCheckbox) {
|
153 |
-
apiKeyInput.addEventListener('change', function(e) {
|
154 |
-
if (saveKeyCheckbox.checked) {
|
155 |
-
localStorage.setItem('gemini_api_key', e.target.value);
|
156 |
-
}
|
157 |
-
});
|
158 |
-
}
|
159 |
-
}, 1000); // Small delay to ensure elements are loaded
|
160 |
-
});
|
161 |
-
}
|
162 |
-
""") as app:
|
163 |
gr.Markdown("# Gemini Image Editor")
|
164 |
gr.Markdown("Upload an image, enter a description of the edit you want, and let Gemini do the rest!")
|
165 |
|
166 |
# Store image history in state
|
167 |
image_history = gr.State([])
|
168 |
|
|
|
|
|
|
|
169 |
with gr.Row():
|
170 |
with gr.Column():
|
171 |
input_image = gr.Image(type="pil", label="Upload Image")
|
172 |
prompt = gr.Textbox(label="Edit Description", placeholder="Describe the edit you want...")
|
173 |
api_key = gr.Textbox(label="Gemini API Key", placeholder="Enter your Gemini API key", type="password")
|
174 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
175 |
|
176 |
with gr.Row():
|
177 |
edit_btn = gr.Button("Edit Image")
|
@@ -181,10 +167,20 @@ def create_ui():
|
|
181 |
output_image = gr.Image(type="pil", label="Edited Image")
|
182 |
status = gr.Textbox(label="Status", interactive=False)
|
183 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
184 |
# Set up event handlers
|
185 |
edit_btn.click(
|
186 |
fn=process_image_edit,
|
187 |
-
inputs=[input_image, prompt, api_key, image_history],
|
188 |
outputs=[output_image, image_history, status]
|
189 |
)
|
190 |
|
|
|
14 |
img.save(img_byte_arr, format=format)
|
15 |
return img_byte_arr.getvalue()
|
16 |
|
|
|
|
|
|
|
|
|
17 |
# Function to load image as base64
|
18 |
async def load_image_base64(img):
|
19 |
if isinstance(img, str):
|
|
|
24 |
return pil_to_bytes(img)
|
25 |
|
26 |
# Main function to generate edited image using Gemini
|
27 |
+
async def generate_image_gemini(prompt, image, api_key, temperature=0.4):
|
28 |
SAFETY_SETTINGS = {
|
29 |
types.HarmCategory.HARM_CATEGORY_HARASSMENT: types.HarmBlockThreshold.BLOCK_NONE,
|
30 |
types.HarmCategory.HARM_CATEGORY_HATE_SPEECH: types.HarmBlockThreshold.BLOCK_NONE,
|
|
|
69 |
model="gemini-2.0-flash-exp",
|
70 |
contents=contents,
|
71 |
config=types.GenerateContentConfig(
|
72 |
+
temperature=temperature,
|
73 |
safety_settings=[
|
74 |
types.SafetySetting(
|
75 |
category=category, threshold=threshold
|
|
|
97 |
return None
|
98 |
|
99 |
# Function to process the image edit
|
100 |
+
def process_image_edit(image, prompt, api_key, image_history, temperature):
|
101 |
if not image or not prompt or not api_key:
|
102 |
return None, image_history, "Please provide an image, prompt, and API key"
|
103 |
|
|
|
109 |
|
110 |
# Run the async function to edit the image
|
111 |
try:
|
112 |
+
edited_image = asyncio.run(generate_image_gemini(prompt, image, api_key, temperature))
|
113 |
if edited_image:
|
114 |
return edited_image, image_history, "Image edited successfully"
|
115 |
else:
|
|
|
129 |
|
130 |
# Create Gradio UI
|
131 |
def create_ui():
|
132 |
+
with gr.Blocks(title="Gemini Image Editor") as app:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
133 |
gr.Markdown("# Gemini Image Editor")
|
134 |
gr.Markdown("Upload an image, enter a description of the edit you want, and let Gemini do the rest!")
|
135 |
|
136 |
# Store image history in state
|
137 |
image_history = gr.State([])
|
138 |
|
139 |
+
# Settings visibility state
|
140 |
+
settings_visible = gr.State(False)
|
141 |
+
|
142 |
with gr.Row():
|
143 |
with gr.Column():
|
144 |
input_image = gr.Image(type="pil", label="Upload Image")
|
145 |
prompt = gr.Textbox(label="Edit Description", placeholder="Describe the edit you want...")
|
146 |
api_key = gr.Textbox(label="Gemini API Key", placeholder="Enter your Gemini API key", type="password")
|
147 |
+
|
148 |
+
# Settings button and panel
|
149 |
+
settings_btn = gr.Button("⚙️ Settings", scale=0.15)
|
150 |
+
|
151 |
+
with gr.Column(visible=False) as settings_panel:
|
152 |
+
gr.Markdown("### Advanced Settings")
|
153 |
+
temperature = gr.Slider(
|
154 |
+
minimum=0.0,
|
155 |
+
maximum=2.0,
|
156 |
+
value=0.4,
|
157 |
+
step=0.05,
|
158 |
+
label="Temperature",
|
159 |
+
info="Controls randomness in generation (0 = deterministic, 1 = creative, 2 = extreme)"
|
160 |
+
)
|
161 |
|
162 |
with gr.Row():
|
163 |
edit_btn = gr.Button("Edit Image")
|
|
|
167 |
output_image = gr.Image(type="pil", label="Edited Image")
|
168 |
status = gr.Textbox(label="Status", interactive=False)
|
169 |
|
170 |
+
# Toggle settings visibility
|
171 |
+
def toggle_settings(visible):
|
172 |
+
return not visible, not visible
|
173 |
+
|
174 |
+
settings_btn.click(
|
175 |
+
fn=toggle_settings,
|
176 |
+
inputs=[settings_visible],
|
177 |
+
outputs=[settings_visible, settings_panel]
|
178 |
+
)
|
179 |
+
|
180 |
# Set up event handlers
|
181 |
edit_btn.click(
|
182 |
fn=process_image_edit,
|
183 |
+
inputs=[input_image, prompt, api_key, image_history, temperature],
|
184 |
outputs=[output_image, image_history, status]
|
185 |
)
|
186 |
|