wilwork commited on
Commit
cf16f32
·
verified ·
1 Parent(s): cf604df

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +53 -38
app.py CHANGED
@@ -7,23 +7,36 @@ import numpy as np
7
  # Load JinaAI CLIP model
8
  model = AutoModel.from_pretrained('jinaai/jina-clip-v1', trust_remote_code=True)
9
 
10
- def compute_similarity(input1, input2):
11
  """
12
  Computes similarity between:
13
- - Image and Text
14
- - Image and Image
15
- - Text and Text
16
  """
17
-
18
- # Detect input types
19
- input1_is_text = isinstance(input1, str) and input1.strip() != ""
20
- input2_is_text = isinstance(input2, str) and input2.strip() != ""
21
- input1_is_image = isinstance(input1, np.ndarray)
22
- input2_is_image = isinstance(input2, np.ndarray)
 
 
 
 
 
 
 
 
 
 
 
 
 
23
 
24
  # Ensure valid input
25
  if not (input1_is_text or input1_is_image) or not (input2_is_text or input2_is_image):
26
- return "Error: Both inputs must be valid (image or text)!"
27
 
28
  try:
29
  with torch.no_grad():
@@ -59,32 +72,34 @@ def compute_similarity(input1, input2):
59
  return f"Error: {str(e)}"
60
 
61
  # Gradio UI
62
- demo = gr.Interface(
63
- fn=compute_similarity,
64
- inputs=[
65
- gr.Radio(["Text", "Image"], label="Input 1 Type", value="Text"),
66
- gr.Textbox(label="Text Input 1", visible=True),
67
- gr.Image(type="numpy", label="Image Input 1", visible=False),
68
-
69
- gr.Radio(["Text", "Image"], label="Input 2 Type", value="Text"),
70
- gr.Textbox(label="Text Input 2", visible=True),
71
- gr.Image(type="numpy", label="Image Input 2", visible=False),
72
- ],
73
- outputs=gr.Textbox(label="Similarity Score / Error", interactive=False),
74
- title="JinaAI CLIP Multimodal Similarity",
75
- description="Compare similarity between two inputs (Text, Image, or both)."
76
- )
77
-
78
- # Update visibility dynamically
79
- def update_visibility(input1_type, input2_type):
80
- return (
81
- input1_type == "Text", # Text input 1 visibility
82
- input1_type == "Image", # Image input 1 visibility
83
- input2_type == "Text", # Text input 2 visibility
84
- input2_type == "Image" # Image input 2 visibility
85
- )
86
-
87
- # Add event handlers for input type change
88
- demo.load(update_visibility, inputs=["Input 1 Type", "Input 2 Type"], outputs=["Text Input 1", "Image Input 1", "Text Input 2", "Image Input 2"])
 
 
89
 
90
  demo.launch()
 
7
  # Load JinaAI CLIP model
8
  model = AutoModel.from_pretrained('jinaai/jina-clip-v1', trust_remote_code=True)
9
 
10
+ def compute_similarity(input1_type, input1_text, input1_image, input2_type, input2_text, input2_image):
11
  """
12
  Computes similarity between:
13
+ - Text-Text
14
+ - Image-Image
15
+ - Text-Image & Image-Text
16
  """
17
+
18
+ # Determine input types
19
+ if input1_type == "Text":
20
+ input1 = input1_text.strip()
21
+ input1_is_text = bool(input1)
22
+ input1_is_image = False
23
+ else:
24
+ input1 = input1_image
25
+ input1_is_text = False
26
+ input1_is_image = input1 is not None
27
+
28
+ if input2_type == "Text":
29
+ input2 = input2_text.strip()
30
+ input2_is_text = bool(input2)
31
+ input2_is_image = False
32
+ else:
33
+ input2 = input2_image
34
+ input2_is_text = False
35
+ input2_is_image = input2 is not None
36
 
37
  # Ensure valid input
38
  if not (input1_is_text or input1_is_image) or not (input2_is_text or input2_is_image):
39
+ return "Error: Please provide valid inputs (text or image) for both fields!"
40
 
41
  try:
42
  with torch.no_grad():
 
72
  return f"Error: {str(e)}"
73
 
74
  # Gradio UI
75
+ with gr.Blocks() as demo:
76
+ gr.Markdown("# JinaAI CLIP Multimodal Similarity")
77
+ gr.Markdown("Compare similarity between two inputs: **Text-Text, Image-Image, or Image-Text**.")
78
+
79
+ with gr.Row():
80
+ input1_type = gr.Radio(["Text", "Image"], label="Input 1 Type", value="Text")
81
+ input2_type = gr.Radio(["Text", "Image"], label="Input 2 Type", value="Text")
82
+
83
+ input1_text = gr.Textbox(label="Input 1 (Text)", visible=True)
84
+ input1_image = gr.Image(type="numpy", label="Input 1 (Image)", visible=False)
85
+
86
+ input2_text = gr.Textbox(label="Input 2 (Text)", visible=True)
87
+ input2_image = gr.Image(type="numpy", label="Input 2 (Image)", visible=False)
88
+
89
+ output = gr.Textbox(label="Similarity Score / Error", interactive=False)
90
+
91
+ def update_visibility(input1_type, input2_type):
92
+ return (
93
+ input1_type == "Text", # Input 1 text visibility
94
+ input1_type == "Image", # Input 1 image visibility
95
+ input2_type == "Text", # Input 2 text visibility
96
+ input2_type == "Image" # Input 2 image visibility
97
+ )
98
+
99
+ input1_type.change(update_visibility, inputs=[input1_type, input2_type], outputs=[input1_text, input1_image, input2_text, input2_image])
100
+ input2_type.change(update_visibility, inputs=[input1_type, input2_type], outputs=[input1_text, input1_image, input2_text, input2_image])
101
+
102
+ compute_button = gr.Button("Compute Similarity")
103
+ compute_button.click(compute_similarity, inputs=[input1_type, input1_text, input1_image, input2_type, input2_text, input2_image], outputs=output)
104
 
105
  demo.launch()