Update app.py
Browse files
app.py
CHANGED
@@ -21,7 +21,8 @@ def find_similarity(base64_image, text_input):
|
|
21 |
image = Image.open(BytesIO(image_bytes))
|
22 |
|
23 |
# Preprocess the image
|
24 |
-
image = preprocess(image).unsqueeze(0).to(device)
|
|
|
25 |
|
26 |
# Prepare input text
|
27 |
text_tokens = clip.tokenize([text_input]).to(device)
|
@@ -36,7 +37,7 @@ def find_similarity(base64_image, text_input):
|
|
36 |
# Normalize features and calculate similarity
|
37 |
image_features /= image_features.norm(dim=-1, keepdim=True)
|
38 |
text_features /= text_features.norm(dim=-1, keepdim=True)
|
39 |
-
similarity = (text_features @ image_features.T).
|
40 |
|
41 |
return similarity
|
42 |
|
@@ -48,7 +49,6 @@ iface = gr.Interface(
|
|
48 |
"text"
|
49 |
],
|
50 |
outputs="number",
|
51 |
-
live=True,
|
52 |
interpretation="default",
|
53 |
title="CLIP Model Image-Text Cosine Similarity",
|
54 |
description="Upload a base64 image and enter text to find their cosine similarity.",
|
|
|
21 |
image = Image.open(BytesIO(image_bytes))
|
22 |
|
23 |
# Preprocess the image
|
24 |
+
# image = preprocess(image).unsqueeze(0).to(device)
|
25 |
+
image = preprocess(image).to(device)
|
26 |
|
27 |
# Prepare input text
|
28 |
text_tokens = clip.tokenize([text_input]).to(device)
|
|
|
37 |
# Normalize features and calculate similarity
|
38 |
image_features /= image_features.norm(dim=-1, keepdim=True)
|
39 |
text_features /= text_features.norm(dim=-1, keepdim=True)
|
40 |
+
similarity = (text_features @ image_features.T).cpu().numpy()
|
41 |
|
42 |
return similarity
|
43 |
|
|
|
49 |
"text"
|
50 |
],
|
51 |
outputs="number",
|
|
|
52 |
interpretation="default",
|
53 |
title="CLIP Model Image-Text Cosine Similarity",
|
54 |
description="Upload a base64 image and enter text to find their cosine similarity.",
|