From 625a646520761caeb01bce8007fd5fe0e6ab627c Mon Sep 17 00:00:00 2001
From: Leo Ueno <leo@roboflow.com>
Date: Sat, 30 Nov 2024 21:01:17 -0800
Subject: [PATCH 1/3] Add method

---
 supervision/detection/core.py | 96 +++++++++++++++++++++++++++++++++++
 1 file changed, 96 insertions(+)

diff --git a/supervision/detection/core.py b/supervision/detection/core.py
index 74c663a89..a27825d5a 100644
--- a/supervision/detection/core.py
+++ b/supervision/detection/core.py
@@ -1391,6 +1391,102 @@ def with_nmm(
             result.append(merged_detections)
 
         return Detections.merge(result)
+    
+        @classmethod
+    def from_gcp_vision(cls, gcp_results, size) -> Detections:
+        """
+        Creates a Detections instance from the
+            [Google Cloud Vision API's](https://cloud.google.com/vision/docs)
+            inference result.
+
+        Args:
+            gcp_results (Iterable): The `localized_object_annotations` of a GCP
+                Vision response; items expose `name`, `score`, `bounding_poly`.
+            size (Tuple[int, int]): The height, then width of the input image.
+
+        Returns:
+            Detections: A new Detections object.
+
+        Example:
+            ```python
+            >>> import supervision as sv
+            >>> from google.cloud import vision
+            >>> from PIL import Image
+
+            >>> image_path = "/content/people.jpeg"
+            >>> img = Image.open(image_path)
+
+            >>> client = vision.ImageAnnotatorClient()
+
+            >>> with open(image_path, "rb") as image_file:
+            ...     content = image_file.read()
+
+            >>> image = vision.Image(content=content)
+
+            >>> result = client.object_localization(image=image)
+            >>> objects = result.localized_object_annotations
+
+            >>> detections = sv.Detections.from_gcp_vision(
+            ...     gcp_results=objects,
+            ...     size=(img.height, img.width)
+            ... )
+            ```
+        """
+        xyxys, confidences, class_ids = [], [], []
+
+        class_id_reference = {}
+
+        for object_ in gcp_results:
+            # Detections needs axis-aligned boxes as [x0, y0, x1, y1], so reduce
+            # the polygon returned by the GCP Vision API to its min/max extents
+
+            object_bboxes = []
+
+            for vertex in object_.bounding_poly.normalized_vertices:
+                object_bboxes.append([vertex.x, vertex.y])
+
+            object_bboxes = np.array(object_bboxes)
+
+            x0 = object_bboxes[:, 0].min()
+            y0 = object_bboxes[:, 1].min()
+            x1 = object_bboxes[:, 0].max()
+            y1 = object_bboxes[:, 1].max()
+
+            height, width = size
+
+            # scale normalized (0-1) coordinates to absolute pixel coordinates
+            x0 *= width
+            y0 *= height
+            x1 *= width
+            y1 *= height
+
+            class_name = object_.name
+
+            xyxys.append([x0, y0, x1, y1])
+
+            confidences.append(object_.score)
+
+            if class_id_reference.get(class_name):
+                class_ids.append(class_id_reference[class_name])
+            else:
+                new_id = len(class_id_reference) + 1
+
+                class_id_reference[class_name] = new_id
+
+                class_ids.append(new_id)
+
+        id_to_class_name = {id_: name for name, id_ in class_id_reference.items()}
+        class_names = [id_to_class_name[class_id] for class_id in class_ids]
+
+        if len(xyxys) == 0:
+            return cls.empty()
+
+        return cls(
+            xyxy=np.array(xyxys),
+            class_id=np.array(class_ids),
+            confidence=np.array(confidences),
+            data={CLASS_NAME_DATA_FIELD: np.array(class_names)},
+        )
 
 
 def merge_inner_detection_object_pair(

From d798a658ccfbc77344db40667a596f0a23fb3552 Mon Sep 17 00:00:00 2001
From: "pre-commit-ci[bot]"
 <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Date: Sun, 1 Dec 2024 05:03:20 +0000
Subject: [PATCH 2/3] =?UTF-8?q?fix(pre=5Fcommit):=20=F0=9F=8E=A8=20auto=20?=
 =?UTF-8?q?format=20pre-commit=20hooks?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 supervision/detection/core.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/supervision/detection/core.py b/supervision/detection/core.py
index a27825d5a..9599e8e48 100644
--- a/supervision/detection/core.py
+++ b/supervision/detection/core.py
@@ -1391,7 +1391,7 @@ def with_nmm(
             result.append(merged_detections)
 
         return Detections.merge(result)
-    
+
         @classmethod
     def from_gcp_vision(cls, gcp_results, size) -> Detections:
         """

From 4c92c2da281d29e0c8bff3a69fc6a8958667b433 Mon Sep 17 00:00:00 2001
From: Leo Ueno <leo@roboflow.com>
Date: Sun, 1 Dec 2024 22:27:09 -0800
Subject: [PATCH 3/3] Fix indent

---
 supervision/detection/core.py | 34 +++++++++++++++++++++-------------
 1 file changed, 21 insertions(+), 13 deletions(-)

diff --git a/supervision/detection/core.py b/supervision/detection/core.py
index 9599e8e48..915cfe80b 100644
--- a/supervision/detection/core.py
+++ b/supervision/detection/core.py
@@ -269,9 +269,11 @@ def from_ultralytics(cls, ultralytics_results) -> Detections:
                 xyxy=ultralytics_results.obb.xyxy.cpu().numpy(),
                 confidence=ultralytics_results.obb.conf.cpu().numpy(),
                 class_id=class_id,
-                tracker_id=ultralytics_results.obb.id.int().cpu().numpy()
-                if ultralytics_results.obb.id is not None
-                else None,
+                tracker_id=(
+                    ultralytics_results.obb.id.int().cpu().numpy()
+                    if ultralytics_results.obb.id is not None
+                    else None
+                ),
                 data={
                     ORIENTED_BOX_COORDINATES: oriented_box_coordinates,
                     CLASS_NAME_DATA_FIELD: class_names,
@@ -293,9 +295,11 @@ def from_ultralytics(cls, ultralytics_results) -> Detections:
             confidence=ultralytics_results.boxes.conf.cpu().numpy(),
             class_id=class_id,
             mask=extract_ultralytics_masks(ultralytics_results),
-            tracker_id=ultralytics_results.boxes.id.int().cpu().numpy()
-            if ultralytics_results.boxes.id is not None
-            else None,
+            tracker_id=(
+                ultralytics_results.boxes.id.int().cpu().numpy()
+                if ultralytics_results.boxes.id is not None
+                else None
+            ),
             data={CLASS_NAME_DATA_FIELD: class_names},
         )
 
@@ -447,9 +451,11 @@ def from_mmdetection(cls, mmdet_results) -> Detections:
             xyxy=mmdet_results.pred_instances.bboxes.cpu().numpy(),
             confidence=mmdet_results.pred_instances.scores.cpu().numpy(),
             class_id=mmdet_results.pred_instances.labels.cpu().numpy().astype(int),
-            mask=mmdet_results.pred_instances.masks.cpu().numpy()
-            if "masks" in mmdet_results.pred_instances
-            else None,
+            mask=(
+                mmdet_results.pred_instances.masks.cpu().numpy()
+                if "masks" in mmdet_results.pred_instances
+                else None
+            ),
         )
 
     @classmethod
@@ -567,9 +573,11 @@ class IDs, and confidences of the predictions.
         return cls(
             xyxy=detectron2_results["instances"].pred_boxes.tensor.cpu().numpy(),
             confidence=detectron2_results["instances"].scores.cpu().numpy(),
-            mask=detectron2_results["instances"].pred_masks.cpu().numpy()
-            if hasattr(detectron2_results["instances"], "pred_masks")
-            else None,
+            mask=(
+                detectron2_results["instances"].pred_masks.cpu().numpy()
+                if hasattr(detectron2_results["instances"], "pred_masks")
+                else None
+            ),
             class_id=detectron2_results["instances"]
             .pred_classes.cpu()
             .numpy()
@@ -1392,7 +1400,7 @@ def with_nmm(
 
         return Detections.merge(result)
 
-        @classmethod
+    @classmethod
     def from_gcp_vision(cls, gcp_results, size) -> Detections:
         """
         Creates a Detections instance from the