derekalia committed on
Commit
69842c6
·
1 Parent(s): 4020710
Files changed (1) hide show
  1. app.py +2 -20
app.py CHANGED
@@ -83,6 +83,7 @@ def process(
83
  dino_labled_img, label_coordinates, parsed_content_list = get_som_labeled_img(image_save_path, yolo_model, BOX_TRESHOLD = box_threshold, output_coord_in_ratio=False, ocr_bbox=ocr_bbox,draw_bbox_config=draw_bbox_config, caption_model_processor=caption_model_processor, ocr_text=text,iou_threshold=iou_threshold)
84
  image = Image.open(io.BytesIO(base64.b64decode(dino_labled_img)))
85
  print('finish processing')
 
86
 
87
  # Format the coordinates output in a more readable way
88
  # coordinates_text = "Bounding Box Coordinates (x, y, width, height):\n"
@@ -91,27 +92,8 @@ def process(
91
  # coords_list = coords.tolist()
92
  # coords_formatted = [f"{coord:.1f}" for coord in coords_list]
93
  # coordinates_text += f"Box {box_id}: [{coords_formatted[0]}, {coords_formatted[1]}, {coords_formatted[2]}, {coords_formatted[3]}]\n"
94
-
95
- combined_content = []
96
- for i, content in enumerate(parsed_content_list):
97
- if content.startswith('Text Box ID'):
98
- box_id = str(i)
99
- else:
100
- # Extract the ID number from Icon Box ID format
101
- box_id = content.split('Icon Box ID ')[1].split(':')[0]
102
 
103
- coords = label_coordinates.get(box_id)
104
- if coords is not None: # Changed from 'if coords:' to handle numpy arrays
105
- coords_str = [round(x) for x in coords] # Convert numpy values to rounded integers
106
- combined_content.append(f"{content} | Coordinates: {coords_str}")
107
- else:
108
- combined_content.append(content)
109
-
110
- # Join the content lists into strings
111
- parsed_content_str = '\n'.join(parsed_content_list)
112
- combined_content_str = '\n'.join(combined_content)
113
-
114
- return image, parsed_content_str, combined_content_str
115
 
116
 
117
  with gr.Blocks() as demo:
 
83
  dino_labled_img, label_coordinates, parsed_content_list = get_som_labeled_img(image_save_path, yolo_model, BOX_TRESHOLD = box_threshold, output_coord_in_ratio=False, ocr_bbox=ocr_bbox,draw_bbox_config=draw_bbox_config, caption_model_processor=caption_model_processor, ocr_text=text,iou_threshold=iou_threshold)
84
  image = Image.open(io.BytesIO(base64.b64decode(dino_labled_img)))
85
  print('finish processing')
86
+ parsed_content_list = '\n'.join(parsed_content_list)
87
 
88
  # Format the coordinates output in a more readable way
89
  # coordinates_text = "Bounding Box Coordinates (x, y, width, height):\n"
 
92
  # coords_list = coords.tolist()
93
  # coords_formatted = [f"{coord:.1f}" for coord in coords_list]
94
  # coordinates_text += f"Box {box_id}: [{coords_formatted[0]}, {coords_formatted[1]}, {coords_formatted[2]}, {coords_formatted[3]}]\n"
 
 
 
 
 
 
 
 
95
 
96
+ return image, str(parsed_content_list), str(label_coordinates)
 
 
 
 
 
 
 
 
 
 
 
97
 
98
 
99
  with gr.Blocks() as demo: