saq1b commited on
Commit
f60dff7
·
verified ·
1 Parent(s): 3a6f640

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +33 -37
app.py CHANGED
@@ -14,10 +14,6 @@ def pil_to_bytes(img, format="PNG"):
14
  img.save(img_byte_arr, format=format)
15
  return img_byte_arr.getvalue()
16
 
17
- # Function to save API key in browser local storage
18
- def save_api_key(api_key):
19
- return api_key
20
-
21
  # Function to load image as base64
22
  async def load_image_base64(img):
23
  if isinstance(img, str):
@@ -28,7 +24,7 @@ async def load_image_base64(img):
28
  return pil_to_bytes(img)
29
 
30
  # Main function to generate edited image using Gemini
31
- async def generate_image_gemini(prompt, image, api_key):
32
  SAFETY_SETTINGS = {
33
  types.HarmCategory.HARM_CATEGORY_HARASSMENT: types.HarmBlockThreshold.BLOCK_NONE,
34
  types.HarmCategory.HARM_CATEGORY_HATE_SPEECH: types.HarmBlockThreshold.BLOCK_NONE,
@@ -73,6 +69,7 @@ async def generate_image_gemini(prompt, image, api_key):
73
  model="gemini-2.0-flash-exp",
74
  contents=contents,
75
  config=types.GenerateContentConfig(
 
76
  safety_settings=[
77
  types.SafetySetting(
78
  category=category, threshold=threshold
@@ -100,7 +97,7 @@ async def generate_image_gemini(prompt, image, api_key):
100
  return None
101
 
102
  # Function to process the image edit
103
- def process_image_edit(image, prompt, api_key, image_history):
104
  if not image or not prompt or not api_key:
105
  return None, image_history, "Please provide an image, prompt, and API key"
106
 
@@ -112,7 +109,7 @@ def process_image_edit(image, prompt, api_key, image_history):
112
 
113
  # Run the async function to edit the image
114
  try:
115
- edited_image = asyncio.run(generate_image_gemini(prompt, image, api_key))
116
  if edited_image:
117
  return edited_image, image_history, "Image edited successfully"
118
  else:
@@ -132,46 +129,35 @@ def undo_edit(image_history):
132
 
133
  # Create Gradio UI
134
  def create_ui():
135
- with gr.Blocks(title="Gemini Image Editor", js="""
136
- function() {
137
- // Wait for the DOM to be fully loaded
138
- window.addEventListener('DOMContentLoaded', (event) => {
139
- setTimeout(function() {
140
- // Try to load saved API key from localStorage
141
- const savedKey = localStorage.getItem('gemini_api_key');
142
- const apiKeyInput = document.querySelector('input[placeholder="Enter your Gemini API key"]');
143
- if (savedKey && apiKeyInput) {
144
- apiKeyInput.value = savedKey;
145
- // Dispatch an input event to make sure Gradio recognizes the change
146
- const event = new Event('input', { bubbles: true });
147
- apiKeyInput.dispatchEvent(event);
148
- }
149
-
150
- // Add event listener to save API key when checkbox is checked
151
- const saveKeyCheckbox = document.querySelector('input[type="checkbox"]');
152
- if (apiKeyInput && saveKeyCheckbox) {
153
- apiKeyInput.addEventListener('change', function(e) {
154
- if (saveKeyCheckbox.checked) {
155
- localStorage.setItem('gemini_api_key', e.target.value);
156
- }
157
- });
158
- }
159
- }, 1000); // Small delay to ensure elements are loaded
160
- });
161
- }
162
- """) as app:
163
  gr.Markdown("# Gemini Image Editor")
164
  gr.Markdown("Upload an image, enter a description of the edit you want, and let Gemini do the rest!")
165
 
166
  # Store image history in state
167
  image_history = gr.State([])
168
 
 
 
 
169
  with gr.Row():
170
  with gr.Column():
171
  input_image = gr.Image(type="pil", label="Upload Image")
172
  prompt = gr.Textbox(label="Edit Description", placeholder="Describe the edit you want...")
173
  api_key = gr.Textbox(label="Gemini API Key", placeholder="Enter your Gemini API key", type="password")
174
- save_key = gr.Checkbox(label="Save API key in browser", value=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
175
 
176
  with gr.Row():
177
  edit_btn = gr.Button("Edit Image")
@@ -181,10 +167,20 @@ def create_ui():
181
  output_image = gr.Image(type="pil", label="Edited Image")
182
  status = gr.Textbox(label="Status", interactive=False)
183
 
 
 
 
 
 
 
 
 
 
 
184
  # Set up event handlers
185
  edit_btn.click(
186
  fn=process_image_edit,
187
- inputs=[input_image, prompt, api_key, image_history],
188
  outputs=[output_image, image_history, status]
189
  )
190
 
 
14
  img.save(img_byte_arr, format=format)
15
  return img_byte_arr.getvalue()
16
 
 
 
 
 
17
  # Function to load image as base64
18
  async def load_image_base64(img):
19
  if isinstance(img, str):
 
24
  return pil_to_bytes(img)
25
 
26
  # Main function to generate edited image using Gemini
27
+ async def generate_image_gemini(prompt, image, api_key, temperature=0.4):
28
  SAFETY_SETTINGS = {
29
  types.HarmCategory.HARM_CATEGORY_HARASSMENT: types.HarmBlockThreshold.BLOCK_NONE,
30
  types.HarmCategory.HARM_CATEGORY_HATE_SPEECH: types.HarmBlockThreshold.BLOCK_NONE,
 
69
  model="gemini-2.0-flash-exp",
70
  contents=contents,
71
  config=types.GenerateContentConfig(
72
+ temperature=temperature,
73
  safety_settings=[
74
  types.SafetySetting(
75
  category=category, threshold=threshold
 
97
  return None
98
 
99
  # Function to process the image edit
100
+ def process_image_edit(image, prompt, api_key, image_history, temperature):
101
  if not image or not prompt or not api_key:
102
  return None, image_history, "Please provide an image, prompt, and API key"
103
 
 
109
 
110
  # Run the async function to edit the image
111
  try:
112
+ edited_image = asyncio.run(generate_image_gemini(prompt, image, api_key, temperature))
113
  if edited_image:
114
  return edited_image, image_history, "Image edited successfully"
115
  else:
 
129
 
130
  # Create Gradio UI
131
  def create_ui():
132
+ with gr.Blocks(title="Gemini Image Editor") as app:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
133
  gr.Markdown("# Gemini Image Editor")
134
  gr.Markdown("Upload an image, enter a description of the edit you want, and let Gemini do the rest!")
135
 
136
  # Store image history in state
137
  image_history = gr.State([])
138
 
139
+ # Settings visibility state
140
+ settings_visible = gr.State(False)
141
+
142
  with gr.Row():
143
  with gr.Column():
144
  input_image = gr.Image(type="pil", label="Upload Image")
145
  prompt = gr.Textbox(label="Edit Description", placeholder="Describe the edit you want...")
146
  api_key = gr.Textbox(label="Gemini API Key", placeholder="Enter your Gemini API key", type="password")
147
+
148
+ # Settings button and panel
149
+ settings_btn = gr.Button("⚙️ Settings", scale=0.15)
150
+
151
+ with gr.Column(visible=False) as settings_panel:
152
+ gr.Markdown("### Advanced Settings")
153
+ temperature = gr.Slider(
154
+ minimum=0.0,
155
+ maximum=2.0,
156
+ value=0.4,
157
+ step=0.05,
158
+ label="Temperature",
159
+ info="Controls randomness in generation (0 = deterministic, 1 = creative, 2 = extreme)"
160
+ )
161
 
162
  with gr.Row():
163
  edit_btn = gr.Button("Edit Image")
 
167
  output_image = gr.Image(type="pil", label="Edited Image")
168
  status = gr.Textbox(label="Status", interactive=False)
169
 
170
+ # Toggle settings visibility
171
+ def toggle_settings(visible):
172
+ return not visible, not visible
173
+
174
+ settings_btn.click(
175
+ fn=toggle_settings,
176
+ inputs=[settings_visible],
177
+ outputs=[settings_visible, settings_panel]
178
+ )
179
+
180
  # Set up event handlers
181
  edit_btn.click(
182
  fn=process_image_edit,
183
+ inputs=[input_image, prompt, api_key, image_history, temperature],
184
  outputs=[output_image, image_history, status]
185
  )
186