Spaces:

jackyccl
/

segment-anything

Runtime error

App Files Files Community

jackyccl committed on Apr 22, 2023

Commit

f80c1b9

1 Parent(s): 7b58807

fix bugs

Browse files

Files changed (1) hide show

app.py +10 -5

app.py CHANGED Viewed

@@ -137,15 +137,20 @@ def show_mask(mask, ax, random_color=False):
 def show_box(box, ax, label):
     x0, y0 = box[0], box[1]
     w, h = box[2] - box[0], box[3] - box[1]
-    ax.add_patch(plt.Rectangle((x0, y0), w, h, edgecolor='green', facecolor=(0,0,0,0), lw=2))
-    ax.text(x0, y0, label, fontdict={'fontsize': 7})
 def get_grounding_box(image_tensor, grounding_caption, box_threshold, text_threshold):
     # run grounding
     boxes, logits, phrases = predict(groundingDino_model, image_tensor, grounding_caption, box_threshold, text_threshold, device=groundingdino_device)
     # annotated_frame = annotate(image_source=np.asarray(image_pil), boxes=boxes, logits=logits, phrases=phrases)
     # image_with_box = Image.fromarray(cv2.cvtColor(annotated_frame, cv2.COLOR_BGR2RGB))
-    return boxes, phrases
 def grounding_sam(input_image, text_prompt, task_type, box_threshold, text_threshold, iou_threshold):
     text_prompt = text_prompt.strip()
@@ -210,7 +215,7 @@ def grounding_sam(input_image, text_prompt, task_type, box_threshold, text_thres
         )
         # draw output image
-        plt.figure(figsize=(10, 10))
         plt.imshow(image)
         for mask in masks:
             show_mask(mask.cpu().numpy(), plt.gca(), random_color=True)
@@ -246,7 +251,7 @@ if __name__ == "__main__":
                 input_image = gr.Image(source='upload', elem_id="image_upload", tool='sketch', type='pil', label="Upload")
                 task_type = gr.Radio(["segment"],  value="segment",
                                                 label='Task type',interactive=True, visible=True)
-                text_prompt = gr.Textbox(label="Detection Prompt, seperating each name with ',', i.e.: cat,dog,chair ]", \
                                          placeholder="Cannot be empty")
                 run_button = gr.Button(label="Run")

 def show_box(box, ax, label):
     x0, y0 = box[0], box[1]
     w, h = box[2] - box[0], box[3] - box[1]
+    ax.add_patch(plt.Rectangle((x0, y0), w, h, edgecolor='red', facecolor=(0,0,0,0), lw=2))
+    ax.text(x0, y0+20, label, fontdict={'fontsize': 10}, color="white")
 def get_grounding_box(image_tensor, grounding_caption, box_threshold, text_threshold):
     # run grounding
     boxes, logits, phrases = predict(groundingDino_model, image_tensor, grounding_caption, box_threshold, text_threshold, device=groundingdino_device)
+    labels = [
+        f"{phrase} ({logit:.2f})"
+        for phrase, logit
+        in zip(phrases, logits)
+    ]
     # annotated_frame = annotate(image_source=np.asarray(image_pil), boxes=boxes, logits=logits, phrases=phrases)
     # image_with_box = Image.fromarray(cv2.cvtColor(annotated_frame, cv2.COLOR_BGR2RGB))
+    return boxes, labels
 def grounding_sam(input_image, text_prompt, task_type, box_threshold, text_threshold, iou_threshold):
     text_prompt = text_prompt.strip()
         )
         # draw output image
+        plt.figure()
         plt.imshow(image)
         for mask in masks:
             show_mask(mask.cpu().numpy(), plt.gca(), random_color=True)
                 input_image = gr.Image(source='upload', elem_id="image_upload", tool='sketch', type='pil', label="Upload")
                 task_type = gr.Radio(["segment"],  value="segment",
                                                 label='Task type',interactive=True, visible=True)
+                text_prompt = gr.Textbox(label="Detection Prompt, seperating each name with dot '.', i.e.: cat.dog.chair ]", \
                                          placeholder="Cannot be empty")
                 run_button = gr.Button(label="Run")