Spaces:
Running
on
Zero
Running
on
Zero
try this
Browse files
app.py
CHANGED
@@ -83,6 +83,7 @@ def process(
|
|
83 |
dino_labled_img, label_coordinates, parsed_content_list = get_som_labeled_img(image_save_path, yolo_model, BOX_TRESHOLD = box_threshold, output_coord_in_ratio=False, ocr_bbox=ocr_bbox,draw_bbox_config=draw_bbox_config, caption_model_processor=caption_model_processor, ocr_text=text,iou_threshold=iou_threshold)
|
84 |
image = Image.open(io.BytesIO(base64.b64decode(dino_labled_img)))
|
85 |
print('finish processing')
|
|
|
86 |
|
87 |
# Format the coordinates output in a more readable way
|
88 |
# coordinates_text = "Bounding Box Coordinates (x, y, width, height):\n"
|
@@ -91,27 +92,8 @@ def process(
|
|
91 |
# coords_list = coords.tolist()
|
92 |
# coords_formatted = [f"{coord:.1f}" for coord in coords_list]
|
93 |
# coordinates_text += f"Box {box_id}: [{coords_formatted[0]}, {coords_formatted[1]}, {coords_formatted[2]}, {coords_formatted[3]}]\n"
|
94 |
-
|
95 |
-
combined_content = []
|
96 |
-
for i, content in enumerate(parsed_content_list):
|
97 |
-
if content.startswith('Text Box ID'):
|
98 |
-
box_id = str(i)
|
99 |
-
else:
|
100 |
-
# Extract the ID number from Icon Box ID format
|
101 |
-
box_id = content.split('Icon Box ID ')[1].split(':')[0]
|
102 |
|
103 |
-
|
104 |
-
if coords is not None: # Changed from 'if coords:' to handle numpy arrays
|
105 |
-
coords_str = [round(x) for x in coords] # Convert numpy values to rounded integers
|
106 |
-
combined_content.append(f"{content} | Coordinates: {coords_str}")
|
107 |
-
else:
|
108 |
-
combined_content.append(content)
|
109 |
-
|
110 |
-
# Join the content lists into strings
|
111 |
-
parsed_content_str = '\n'.join(parsed_content_list)
|
112 |
-
combined_content_str = '\n'.join(combined_content)
|
113 |
-
|
114 |
-
return image, parsed_content_str, combined_content_str
|
115 |
|
116 |
|
117 |
with gr.Blocks() as demo:
|
|
|
83 |
dino_labled_img, label_coordinates, parsed_content_list = get_som_labeled_img(image_save_path, yolo_model, BOX_TRESHOLD = box_threshold, output_coord_in_ratio=False, ocr_bbox=ocr_bbox,draw_bbox_config=draw_bbox_config, caption_model_processor=caption_model_processor, ocr_text=text,iou_threshold=iou_threshold)
|
84 |
image = Image.open(io.BytesIO(base64.b64decode(dino_labled_img)))
|
85 |
print('finish processing')
|
86 |
+
parsed_content_list = '\n'.join(parsed_content_list)
|
87 |
|
88 |
# Format the coordinates output in a more readable way
|
89 |
# coordinates_text = "Bounding Box Coordinates (x, y, width, height):\n"
|
|
|
92 |
# coords_list = coords.tolist()
|
93 |
# coords_formatted = [f"{coord:.1f}" for coord in coords_list]
|
94 |
# coordinates_text += f"Box {box_id}: [{coords_formatted[0]}, {coords_formatted[1]}, {coords_formatted[2]}, {coords_formatted[3]}]\n"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
95 |
|
96 |
+
return image, str(parsed_content_list), str(label_coordinates)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
97 |
|
98 |
|
99 |
with gr.Blocks() as demo:
|