Commit 2f2223a
Parent(s): f1d2589
Update app.py
app.py CHANGED

@@ -554,7 +554,7 @@ def run_anything_task(input_image, text_prompt, box_threshold, text_threshold, i
         groundingdino_model, image, text_prompt, box_threshold, text_threshold, device=groundingdino_device
     )
     if boxes_filt.size(0) == 0:
-        logger.info(f'run_anything_task_[{file_temp}]_
+        logger.info(f'run_anything_task_[{file_temp}]_[{text_prompt}]_1_[No objects detected, please try others.]_')
         return [], gr.Gallery.update(label='No objects detected, please try others.ππππ')
     boxes_filt_ori = copy.deepcopy(boxes_filt)

@@ -565,44 +565,42 @@ def run_anything_task(input_image, text_prompt, box_threshold, text_threshold, i
     }

     # disabled: we don't want to see the boxes
-    …
-    plt.
-    …
-    os.remove(image_path)
-    output_images.append(segment_image_result)
+    image_with_box = plot_boxes_to_image(copy.deepcopy(image_pil), pred_dict)[0]
+    output_images.append(image_with_box)
+
+    image = np.array(input_img)
+    sam_predictor.set_image(image)
+
+    H, W = size[1], size[0]
+    for i in range(boxes_filt.size(0)):
+        boxes_filt[i] = boxes_filt[i] * torch.Tensor([W, H, W, H])
+        boxes_filt[i][:2] -= boxes_filt[i][2:] / 2
+        boxes_filt[i][2:] += boxes_filt[i][:2]
+
+    boxes_filt = boxes_filt.to(sam_device)
+    transformed_boxes = sam_predictor.transform.apply_boxes_torch(boxes_filt, image.shape[:2])
+
+    masks, _, _, _ = sam_predictor.predict_torch(
+        point_coords = None,
+        point_labels = None,
+        boxes = transformed_boxes,
+        multimask_output = False,
+    )
+    # masks: [9, 1, 512, 512]
+    assert sam_checkpoint, 'sam_checkpoint is not found!'
+    # draw output image
+    plt.figure(figsize=(10, 10))
+    plt.imshow(image)
+    for mask in masks:
+        show_mask(mask.cpu().numpy(), plt.gca(), random_color=True)
+    for box, label in zip(boxes_filt, pred_phrases):
+        show_box(box.cpu().numpy(), plt.gca(), label)
+    plt.axis('off')
+    image_path = os.path.join(output_dir, f"grounding_seg_output_{file_temp}.jpg")
+    plt.savefig(image_path, bbox_inches="tight")
+    segment_image_result = cv2.cvtColor(cv2.imread(image_path), cv2.COLOR_BGR2RGB)
+    os.remove(image_path)
+    output_images.append(segment_image_result)

     results = zip(boxes_filt, pred_phrases)
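A note on the box arithmetic in the added lines: GroundingDINO emits boxes as normalized (cx, cy, w, h), and the per-box loop rescales them by the image size, then rewrites them in place as absolute (x0, y0, x1, y1) corners, the format SAM's box prompts expect. A minimal vectorized sketch of the same transform (the function name and variables here are illustrative, not from app.py):

import torch

def cxcywh_norm_to_xyxy_abs(boxes: torch.Tensor, W: int, H: int) -> torch.Tensor:
    # Scale normalized (cx, cy, w, h) boxes up to pixel units.
    scaled = boxes * torch.tensor([W, H, W, H], dtype=boxes.dtype)
    xyxy = scaled.clone()
    xyxy[:, :2] = scaled[:, :2] - scaled[:, 2:] / 2  # top-left corner
    xyxy[:, 2:] = scaled[:, :2] + scaled[:, 2:] / 2  # bottom-right corner
    return xyxy

# A box centered in a 640x480 image with half-width/height extents
# becomes (160, 120, 480, 360).
print(cxcywh_norm_to_xyxy_abs(torch.tensor([[0.5, 0.5, 0.5, 0.5]]), W=640, H=480))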
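The segmentation step follows the usual segment-anything batched-box flow: set_image computes the image embedding once, apply_boxes_torch maps pixel boxes into the model's input frame, and predict_torch returns one mask per box. In the stock segment_anything package, predict_torch returns three values (masks, IoU predictions, low-res logits), so the four-way unpack in the diff presumably targets a modified SAM build bundled with this Space. A sketch against the stock API, assuming a ViT-H checkpoint on disk:

import numpy as np
import torch
from segment_anything import SamPredictor, sam_model_registry

# Assumption: the checkpoint filename is the standard one from the
# segment-anything release, not taken from app.py.
sam = sam_model_registry["vit_h"](checkpoint="sam_vit_h_4b8939.pth")
sam.to("cuda")
predictor = SamPredictor(sam)

image = np.zeros((480, 640, 3), dtype=np.uint8)  # stand-in for the real RGB frame
predictor.set_image(image)  # computes the image embedding once

# (N, 4) absolute-pixel xyxy boxes, e.g. from the conversion sketch above
boxes_xyxy = torch.tensor([[160.0, 120.0, 480.0, 360.0]], device="cuda")
transformed = predictor.transform.apply_boxes_torch(boxes_xyxy, image.shape[:2])

# Stock segment_anything returns three values here.
masks, iou_predictions, low_res_logits = predictor.predict_torch(
    point_coords=None,
    point_labels=None,
    boxes=transformed,
    multimask_output=False,
)
# masks: (N, 1, H, W) boolean tensor, one mask per input box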
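The added lines rasterize the overlay by saving the Matplotlib figure to a temporary JPEG, reading it back with cv2.imread (which yields BGR), converting to RGB, and deleting the file. If the disk round-trip is undesirable, the same result can be had through an in-memory buffer; this is an alternative sketch, not what the commit does:

import io

import cv2
import matplotlib.pyplot as plt
import numpy as np

def figure_to_rgb(fig) -> np.ndarray:
    # Render the figure to an in-memory PNG, then decode it with OpenCV.
    buf = io.BytesIO()
    fig.savefig(buf, format="png", bbox_inches="tight")
    data = np.frombuffer(buf.getvalue(), dtype=np.uint8)
    bgr = cv2.imdecode(data, cv2.IMREAD_COLOR)  # OpenCV decodes to BGR
    return cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)

fig = plt.figure(figsize=(10, 10))
plt.imshow(np.zeros((512, 512, 3), dtype=np.uint8))  # stand-in overlay
plt.axis('off')
print(figure_to_rgb(fig).shape)

Using PNG for the intermediate also sidesteps JPEG compression artifacts in the gallery output, since PNG is lossless.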