SegmentAnythingxGroundingDINO

Sleeping

waleko committed on Oct 16, 2023

Commit

9016294

•

1 Parent(s): ea0da2a

change json + description change

Files changed (1) hide show

app.py CHANGED Viewed

@@ -100,7 +100,7 @@ def detect_objects(image, prompt, show_masks=True, show_boxes=True, crop_options
     output_image_paths = []
-    for i, (input_box, label) in enumerate(zip(boxes, labels)):
         x1, y1, x2, y2 = input_box
         width = x2 - x1
         height = y2 - y1
@@ -143,10 +143,14 @@ def detect_objects(image, prompt, show_masks=True, show_boxes=True, crop_options
         output_image_paths.append(output_image_path)
         # save object information in json
-        res_json["objects"].append(
-            {"label": label, "score": np.max(scores).item(), "box": input_box.tolist(),
-             "center": center_point.tolist(),
-             "avg_size": avg_size})
     return [res_json, output_image_paths]
@@ -171,9 +175,8 @@ app = gr.Interface(
         ["images/penguin.png", "penguin"],
         ["images/penn.jpg", "sign board"]
     ],
-    title="Segment Anything: Animal Edition",
-    description="Zero-Shot Object Detection, Segmentation and Cropping",
-    article="https://segment-anything.com",
 )
 app.launch()

     output_image_paths = []
+    for i, (input_box, label, phrase, logit) in enumerate(zip(boxes, labels, phrases, logits.tolist())):
         x1, y1, x2, y2 = input_box
         width = x2 - x1
         height = y2 - y1
         output_image_paths.append(output_image_path)
         # save object information in json
+        res_json["objects"].append({
+            "label": phrase,
+            "dino_score": logit,
+            "sam_score": np.max(scores).item(),
+            "box": input_box.tolist(),
+            "center": center_point.tolist(),
+            "avg_size": avg_size
+        })
     return [res_json, output_image_paths]
         ["images/penguin.png", "penguin"],
         ["images/penn.jpg", "sign board"]
     ],
+    title="Object Detection, Segmentation and Cropping",
+    description="This app uses DINO to detect objects in an image and then uses SAM to segment and crop the objects.",
 )
 app.launch()