Core

Detections¶

Data class containing information about the detections in a video frame. Attributes: xyxy (np.ndarray): An array of shape (n, 4) containing the bounding boxes coordinates in format [x1, y1, x2, y2] mask: (Optional[np.ndarray]): An array of shape (n, W, H) containing the segmentation masks. confidence (Optional[np.ndarray]): An array of shape (n,) containing the confidence scores of the detections. class_id (Optional[np.ndarray]): An array of shape (n,) containing the class ids of the detections. tracker_id (Optional[np.ndarray]): An array of shape (n,) containing the tracker ids of the detections.

Source code in supervision/detection/core.py

@dataclass
class Detections:
    """
    Data class containing information about the detections in a video frame.
    Attributes:
        xyxy (np.ndarray): An array of shape `(n, 4)` containing the bounding boxes coordinates in format `[x1, y1, x2, y2]`
        mask: (Optional[np.ndarray]): An array of shape `(n, W, H)` containing the segmentation masks.
        confidence (Optional[np.ndarray]): An array of shape `(n,)` containing the confidence scores of the detections.
        class_id (Optional[np.ndarray]): An array of shape `(n,)` containing the class ids of the detections.
        tracker_id (Optional[np.ndarray]): An array of shape `(n,)` containing the tracker ids of the detections.
    """

    xyxy: np.ndarray
    mask: np.Optional[np.ndarray] = None
    confidence: Optional[np.ndarray] = None
    class_id: Optional[np.ndarray] = None
    tracker_id: Optional[np.ndarray] = None

    def __post_init__(self):
        n = len(self.xyxy)
        _validate_xyxy(xyxy=self.xyxy, n=n)
        _validate_mask(mask=self.mask, n=n)
        _validate_class_id(class_id=self.class_id, n=n)
        _validate_confidence(confidence=self.confidence, n=n)
        _validate_tracker_id(tracker_id=self.tracker_id, n=n)

    def __len__(self):
        """
        Returns the number of detections in the Detections object.
        """
        return len(self.xyxy)

    def __iter__(
        self,
    ) -> Iterator[
        Tuple[
            np.ndarray,
            Optional[np.ndarray],
            Optional[float],
            Optional[int],
            Optional[int],
        ]
    ]:
        """
        Iterates over the Detections object and yield a tuple of `(xyxy, mask, confidence, class_id, tracker_id)` for each detection.
        """
        for i in range(len(self.xyxy)):
            yield (
                self.xyxy[i],
                self.mask[i] if self.mask is not None else None,
                self.confidence[i] if self.confidence is not None else None,
                self.class_id[i] if self.class_id is not None else None,
                self.tracker_id[i] if self.tracker_id is not None else None,
            )

    def __eq__(self, other: Detections):
        return all(
            [
                np.array_equal(self.xyxy, other.xyxy),
                any(
                    [
                        self.mask is None and other.mask is None,
                        np.array_equal(self.mask, other.mask),
                    ]
                ),
                any(
                    [
                        self.class_id is None and other.class_id is None,
                        np.array_equal(self.class_id, other.class_id),
                    ]
                ),
                any(
                    [
                        self.confidence is None and other.confidence is None,
                        np.array_equal(self.confidence, other.confidence),
                    ]
                ),
                any(
                    [
                        self.tracker_id is None and other.tracker_id is None,
                        np.array_equal(self.tracker_id, other.tracker_id),
                    ]
                ),
            ]
        )

    @classmethod
    def from_yolov5(cls, yolov5_results) -> Detections:
        """
        Creates a Detections instance from a [YOLOv5](https://github.com/ultralytics/yolov5) inference result.

        Args:
            yolov5_results (yolov5.models.common.Detections): The output Detections instance from YOLOv5

        Returns:
            Detections: A new Detections object.

        Example:
            ```python
            >>> import cv2
            >>> import torch
            >>> import supervision as sv

            >>> image = cv2.imread(SOURCE_IMAGE_PATH)
            >>> model = torch.hub.load('ultralytics/yolov5', 'yolov5s')
            >>> result = model(image)
            >>> detections = sv.Detections.from_yolov5(result)
            ```
        """
        yolov5_detections_predictions = yolov5_results.pred[0].cpu().cpu().numpy()
        return cls(
            xyxy=yolov5_detections_predictions[:, :4],
            confidence=yolov5_detections_predictions[:, 4],
            class_id=yolov5_detections_predictions[:, 5].astype(int),
        )

    @classmethod
    def from_yolov8(cls, yolov8_results) -> Detections:
        """
        Creates a Detections instance from a [YOLOv8](https://github.com/ultralytics/ultralytics) inference result.

        Args:
            yolov8_results (ultralytics.yolo.engine.results.Results): The output Results instance from YOLOv8

        Returns:
            Detections: A new Detections object.

        Example:
            ```python
            >>> import cv2
            >>> from ultralytics import YOLO
            >>> import supervision as sv

            >>> image = cv2.imread(SOURCE_IMAGE_PATH)
            >>> model = YOLO('yolov8s.pt')
            >>> result = model(image)[0]
            >>> detections = sv.Detections.from_yolov8(result)
            ```
        """
        return cls(
            xyxy=yolov8_results.boxes.xyxy.cpu().numpy(),
            confidence=yolov8_results.boxes.conf.cpu().numpy(),
            class_id=yolov8_results.boxes.cls.cpu().numpy().astype(int),
            mask=extract_yolov8_masks(yolov8_results),
        )

    @classmethod
    def from_yolo_nas(cls, yolo_nas_results) -> Detections:
        """
        Creates a Detections instance from a [YOLO-NAS](https://github.com/Deci-AI/super-gradients/blob/master/YOLONAS.md) inference result.

        Args:
            yolo_nas_results (super_gradients.training.models.prediction_results.ImageDetectionPrediction): The output Results instance from YOLO-NAS

        Returns:
            Detections: A new Detections object.

        Example:
            ```python
            >>> import cv2
            >>> from super_gradients.training import models
            >>> import supervision as sv

            >>> image = cv2.imread(SOURCE_IMAGE_PATH)
            >>> model = models.get('yolo_nas_l', pretrained_weights="coco")
            >>> result = list(model.predict(image, conf=0.35))[0]
            >>> detections = sv.Detections.from_yolo_nas(result)
            ```
        """
        return cls(
            xyxy=yolo_nas_results.prediction.bboxes_xyxy,
            confidence=yolo_nas_results.prediction.confidence,
            class_id=yolo_nas_results.prediction.labels.astype(int),
        )

    @classmethod
    def from_transformers(cls, transformers_results: dict) -> Detections:
        """
        Creates a Detections instance from object detection [transformer](https://github.com/huggingface/transformers) inference result.

        Returns:
            Detections: A new Detections object.
        """
        return cls(
            xyxy=transformers_results["boxes"].cpu().numpy(),
            confidence=transformers_results["scores"].cpu().numpy(),
            class_id=transformers_results["labels"].cpu().numpy().astype(int),
        )

    @classmethod
    def from_detectron2(cls, detectron2_results) -> Detections:
        """
        Create a Detections object from the [Detectron2](https://github.com/facebookresearch/detectron2) inference result.

        Args:
            detectron2_results: The output of a Detectron2 model containing instances with prediction data.

        Returns:
            (Detections): A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

        Example:
            ```python
            >>> import cv2
            >>> from detectron2.engine import DefaultPredictor
            >>> from detectron2.config import get_cfg
            >>> import supervision as sv

            >>> image = cv2.imread(SOURCE_IMAGE_PATH)
            >>> cfg = get_cfg()
            >>> cfg.merge_from_file("path/to/config.yaml")
            >>> cfg.MODEL.WEIGHTS = "path/to/model_weights.pth"
            >>> predictor = DefaultPredictor(cfg)
            >>> result = predictor(image)

            >>> detections = sv.Detections.from_detectron2(result)
            ```
        """
        return cls(
            xyxy=detectron2_results["instances"].pred_boxes.tensor.cpu().numpy(),
            confidence=detectron2_results["instances"].scores.cpu().numpy(),
            class_id=detectron2_results["instances"]
            .pred_classes.cpu()
            .numpy()
            .astype(int),
        )

    @classmethod
    def from_roboflow(cls, roboflow_result: dict, class_list: List[str]) -> Detections:
        """
        Create a Detections object from the [Roboflow](https://roboflow.com/) API inference result.

        Args:
            roboflow_result (dict): The result from the Roboflow API containing predictions.
            class_list (List[str]): A list of class names corresponding to the class IDs in the API result.

        Returns:
            (Detections): A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

        Example:
            ```python
            >>> import supervision as sv

            >>> roboflow_result = {
            ...     "predictions": [
            ...         {
            ...             "x": 0.5,
            ...             "y": 0.5,
            ...             "width": 0.2,
            ...             "height": 0.3,
            ...             "class": "person",
            ...             "confidence": 0.9
            ...         },
            ...         # ... more predictions ...
            ...     ]
            ... }
            >>> class_list = ["person", "car", "dog"]

            >>> detections = sv.Detections.from_roboflow(roboflow_result, class_list)
            ```
        """
        xyxy = []
        confidence = []
        class_id = []

        for prediction in roboflow_result["predictions"]:
            x = prediction["x"]
            y = prediction["y"]
            width = prediction["width"]
            height = prediction["height"]
            x_min = x - width / 2
            y_min = y - height / 2
            x_max = x_min + width
            y_max = y_min + height
            xyxy.append([x_min, y_min, x_max, y_max])
            class_id.append(class_list.index(prediction["class"]))
            confidence.append(prediction["confidence"])

        return Detections(
            xyxy=np.array(xyxy),
            confidence=np.array(confidence),
            class_id=np.array(class_id).astype(int),
        )

    @classmethod
    def from_sam(cls, sam_result: List[dict]) -> Detections:
        """
        Creates a Detections instance from [Segment Anything Model](https://github.com/facebookresearch/segment-anything) inference result.

        Args:
            sam_result (List[dict]): The output Results instance from SAM

        Returns:
            Detections: A new Detections object.

        Example:
            ```python
            >>> import supervision as sv
            >>> from segment_anything import sam_model_registry, SamAutomaticMaskGenerator

            >>> sam = sam_model_registry[MODEL_TYPE](checkpoint=CHECKPOINT_PATH).to(device=DEVICE)
            >>> mask_generator = SamAutomaticMaskGenerator(sam)
            >>> sam_result = mask_generator.generate(IMAGE)
            >>> detections = sv.Detections.from_sam(sam_result=sam_result)
            ```
        """
        sorted_generated_masks = sorted(
            sam_result, key=lambda x: x["area"], reverse=True
        )

        xywh = np.array([mask["bbox"] for mask in sorted_generated_masks])
        mask = np.array([mask["segmentation"] for mask in sorted_generated_masks])

        return Detections(xyxy=xywh_to_xyxy(boxes_xywh=xywh), mask=mask)

    @classmethod
    @deprecated(
        "Dataset loading and saving is going to be executed by supervision.dataset.core.Dataset"
    )
    def from_coco_annotations(cls, coco_annotation: dict) -> Detections:
        xyxy, class_id = [], []

        for annotation in coco_annotation:
            x_min, y_min, width, height = annotation["bbox"]
            xyxy.append([x_min, y_min, x_min + width, y_min + height])
            class_id.append(annotation["category_id"])

        return cls(xyxy=np.array(xyxy), class_id=np.array(class_id))

    @classmethod
    def empty(cls) -> Detections:
        """
        Create an empty Detections object with no bounding boxes, confidences, or class IDs.

        Returns:
            (Detections): An empty Detections object.

        Example:
            ```python
            >>> from supervision import Detections

            >>> empty_detections = Detections.empty()
            ```
        """
        return cls(
            xyxy=np.empty((0, 4), dtype=np.float32),
            confidence=np.array([], dtype=np.float32),
            class_id=np.array([], dtype=int),
        )

    @classmethod
    def merge(cls, detections_list: List[Detections]) -> Detections:
        """
        Merge a list of Detections objects into a single Detections object.

        This method takes a list of Detections objects and combines their respective fields (`xyxy`, `mask`,
        `confidence`, `class_id`, and `tracker_id`) into a single Detections object. If all elements in a field are not
        `None`, the corresponding field will be stacked. Otherwise, the field will be set to `None`.

        Args:
            detections_list (List[Detections]): A list of Detections objects to merge.

        Returns:
            (Detections): A single Detections object containing the merged data from the input list.

        Example:
            ```python
            >>> from supervision import Detections

            >>> detections_1 = Detections(...)
            >>> detections_2 = Detections(...)

            >>> merged_detections = Detections.merge([detections_1, detections_2])
            ```
        """
        if len(detections_list) == 0:
            return Detections.empty()

        detections_tuples_list = [astuple(detection) for detection in detections_list]
        xyxy, mask, confidence, class_id, tracker_id = [
            list(field) for field in zip(*detections_tuples_list)
        ]

        all_not_none = lambda l: all(x is not None for x in l)

        xyxy = np.vstack(xyxy)
        mask = np.vstack(mask) if all_not_none(mask) else None
        confidence = np.hstack(confidence) if all_not_none(confidence) else None
        class_id = np.hstack(class_id) if all_not_none(class_id) else None
        tracker_id = np.hstack(tracker_id) if all_not_none(tracker_id) else None

        return cls(
            xyxy=xyxy,
            mask=mask,
            confidence=confidence,
            class_id=class_id,
            tracker_id=tracker_id,
        )

    def get_anchor_coordinates(self, anchor: Position) -> np.ndarray:
        """
        Returns the bounding box coordinates for a specific anchor.

        Args:
            anchor (Position): Position of bounding box anchor for which to return the coordinates.

        Returns:
            np.ndarray: An array of shape `(n, 2)` containing the bounding box anchor coordinates in format `[x, y]`.
        """
        if anchor == Position.CENTER:
            return np.array(
                [
                    (self.xyxy[:, 0] + self.xyxy[:, 2]) / 2,
                    (self.xyxy[:, 1] + self.xyxy[:, 3]) / 2,
                ]
            ).transpose()
        elif anchor == Position.BOTTOM_CENTER:
            return np.array(
                [(self.xyxy[:, 0] + self.xyxy[:, 2]) / 2, self.xyxy[:, 3]]
            ).transpose()

        raise ValueError(f"{anchor} is not supported.")

    def __getitem__(
        self, index: Union[int, slice, List[int], np.ndarray]
    ) -> Detections:
        """
        Get a subset of the Detections object.

        Args:
            index (Union[int, slice, List[int], np.ndarray]): The index or indices of the subset of the Detections

        Returns:
            (Detections): A subset of the Detections object.

        Example:
            ```python
            >>> import supervision as sv

            >>> detections = sv.Detections(...)

            >>> first_detection = detections[0]

            >>> first_10_detections = detections[0:10]

            >>> some_detections = detections[[0, 2, 4]]

            >>> class_0_detections = detections[detections.class_id == 0]

            >>> high_confidence_detections = detections[detections.confidence > 0.5]
            ```
        """
        if isinstance(index, int):
            index = [index]
        return Detections(
            xyxy=self.xyxy[index],
            mask=self.mask[index] if self.mask is not None else None,
            confidence=self.confidence[index] if self.confidence is not None else None,
            class_id=self.class_id[index] if self.class_id is not None else None,
            tracker_id=self.tracker_id[index] if self.tracker_id is not None else None,
        )

    @property
    def area(self) -> np.ndarray:
        """
        Calculate the area of each detection in the set of object detections. If masks field is defined property
        returns are of each mask. If only box is given property return area of each box.

        Returns:
          np.ndarray: An array of floats containing the area of each detection in the format of `(area_1, area_2, ..., area_n)`, where n is the number of detections.
        """
        if self.mask is not None:
            return np.array([np.sum(mask) for mask in self.mask])
        else:
            return self.box_area

    @property
    def box_area(self) -> np.ndarray:
        """
        Calculate the area of each bounding box in the set of object detections.

        Returns:
            np.ndarray: An array of floats containing the area of each bounding box in the format of `(area_1, area_2, ..., area_n)`, where n is the number of detections.
        """
        return (self.xyxy[:, 3] - self.xyxy[:, 1]) * (self.xyxy[:, 2] - self.xyxy[:, 0])

    def with_nms(
        self, threshold: float = 0.5, class_agnostic: bool = False
    ) -> Detections:
        """
        Perform non-maximum suppression on the current set of object detections.

        Args:
            threshold (float, optional): The intersection-over-union threshold to use for non-maximum suppression. Defaults to 0.5.
            class_agnostic (bool, optional): Whether to perform class-agnostic non-maximum suppression. If True, the class_id of each detection will be ignored. Defaults to False.

        Returns:
            Detections: A new Detections object containing the subset of detections after non-maximum suppression.

        Raises:
            AssertionError: If `confidence` is None and class_agnostic is False. If `class_id` is None and class_agnostic is False.
        """
        if len(self) == 0:
            return self

        assert (
            self.confidence is not None
        ), f"Detections confidence must be given for NMS to be executed."

        if class_agnostic:
            predictions = np.hstack((self.xyxy, self.confidence.reshape(-1, 1)))
            indices = non_max_suppression(
                predictions=predictions, iou_threshold=threshold
            )
            return self[indices]

        assert self.class_id is not None, (
            f"Detections class_id must be given for NMS to be executed. If you intended to perform class agnostic "
            f"NMS set class_agnostic=True."
        )

        predictions = np.hstack(
            (self.xyxy, self.confidence.reshape(-1, 1), self.class_id.reshape(-1, 1))
        )
        indices = non_max_suppression(predictions=predictions, iou_threshold=threshold)
        return self[indices]

`area: np.ndarray` `property` ¶

Calculate the area of each detection in the set of object detections. If masks field is defined property returns are of each mask. If only box is given property return area of each box.

Returns:

Type	Description
`ndarray`	np.ndarray: An array of floats containing the area of each detection in the format of `(area_1, area_2, ..., area_n)`, where n is the number of detections.

`box_area: np.ndarray` `property` ¶

Calculate the area of each bounding box in the set of object detections.

Returns:

Type	Description
`ndarray`	np.ndarray: An array of floats containing the area of each bounding box in the format of `(area_1, area_2, ..., area_n)`, where n is the number of detections.

`getitem(index)` ¶

Get a subset of the Detections object.

Parameters:

Name	Type	Description	Default
`index`	`Union[int, slice, List[int], ndarray]`	The index or indices of the subset of the Detections	required

Returns:

Type	Description
`Detections`	A subset of the Detections object.

Example

>>> import supervision as sv

>>> detections = sv.Detections(...)

>>> first_detection = detections[0]

>>> first_10_detections = detections[0:10]

>>> some_detections = detections[[0, 2, 4]]

>>> class_0_detections = detections[detections.class_id == 0]

>>> high_confidence_detections = detections[detections.confidence > 0.5]

Source code in supervision/detection/core.py

def __getitem__(
    self, index: Union[int, slice, List[int], np.ndarray]
) -> Detections:
    """
    Get a subset of the Detections object.

    Args:
        index (Union[int, slice, List[int], np.ndarray]): The index or indices of the subset of the Detections

    Returns:
        (Detections): A subset of the Detections object.

    Example:
        ```python
        >>> import supervision as sv

        >>> detections = sv.Detections(...)

        >>> first_detection = detections[0]

        >>> first_10_detections = detections[0:10]

        >>> some_detections = detections[[0, 2, 4]]

        >>> class_0_detections = detections[detections.class_id == 0]

        >>> high_confidence_detections = detections[detections.confidence > 0.5]
        ```
    """
    if isinstance(index, int):
        index = [index]
    return Detections(
        xyxy=self.xyxy[index],
        mask=self.mask[index] if self.mask is not None else None,
        confidence=self.confidence[index] if self.confidence is not None else None,
        class_id=self.class_id[index] if self.class_id is not None else None,
        tracker_id=self.tracker_id[index] if self.tracker_id is not None else None,
    )

`iter()` ¶

Iterates over the Detections object and yield a tuple of (xyxy, mask, confidence, class_id, tracker_id) for each detection.

Source code in supervision/detection/core.py

def __iter__(
    self,
) -> Iterator[
    Tuple[
        np.ndarray,
        Optional[np.ndarray],
        Optional[float],
        Optional[int],
        Optional[int],
    ]
]:
    """
    Iterates over the Detections object and yield a tuple of `(xyxy, mask, confidence, class_id, tracker_id)` for each detection.
    """
    for i in range(len(self.xyxy)):
        yield (
            self.xyxy[i],
            self.mask[i] if self.mask is not None else None,
            self.confidence[i] if self.confidence is not None else None,
            self.class_id[i] if self.class_id is not None else None,
            self.tracker_id[i] if self.tracker_id is not None else None,
        )

`len()` ¶

Returns the number of detections in the Detections object.

Source code in supervision/detection/core.py

def __len__(self):
    """
    Returns the number of detections in the Detections object.
    """
    return len(self.xyxy)

`empty()` `classmethod` ¶

Create an empty Detections object with no bounding boxes, confidences, or class IDs.

Returns:

Type	Description
`Detections`	An empty Detections object.

Example

>>> from supervision import Detections

>>> empty_detections = Detections.empty()

Source code in supervision/detection/core.py

@classmethod
def empty(cls) -> Detections:
    """
    Create an empty Detections object with no bounding boxes, confidences, or class IDs.

    Returns:
        (Detections): An empty Detections object.

    Example:
        ```python
        >>> from supervision import Detections

        >>> empty_detections = Detections.empty()
        ```
    """
    return cls(
        xyxy=np.empty((0, 4), dtype=np.float32),
        confidence=np.array([], dtype=np.float32),
        class_id=np.array([], dtype=int),
    )

`from_detectron2(detectron2_results)` `classmethod` ¶

Create a Detections object from the Detectron2 inference result.

Parameters:

Name	Type	Description	Default
`detectron2_results`		The output of a Detectron2 model containing instances with prediction data.	required

Returns:

Type	Description
`Detections`	A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

Example

>>> import cv2
>>> from detectron2.engine import DefaultPredictor
>>> from detectron2.config import get_cfg
>>> import supervision as sv

>>> image = cv2.imread(SOURCE_IMAGE_PATH)
>>> cfg = get_cfg()
>>> cfg.merge_from_file("path/to/config.yaml")
>>> cfg.MODEL.WEIGHTS = "path/to/model_weights.pth"
>>> predictor = DefaultPredictor(cfg)
>>> result = predictor(image)

>>> detections = sv.Detections.from_detectron2(result)

Source code in supervision/detection/core.py

@classmethod
def from_detectron2(cls, detectron2_results) -> Detections:
    """
    Create a Detections object from the [Detectron2](https://github.com/facebookresearch/detectron2) inference result.

    Args:
        detectron2_results: The output of a Detectron2 model containing instances with prediction data.

    Returns:
        (Detections): A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

    Example:
        ```python
        >>> import cv2
        >>> from detectron2.engine import DefaultPredictor
        >>> from detectron2.config import get_cfg
        >>> import supervision as sv

        >>> image = cv2.imread(SOURCE_IMAGE_PATH)
        >>> cfg = get_cfg()
        >>> cfg.merge_from_file("path/to/config.yaml")
        >>> cfg.MODEL.WEIGHTS = "path/to/model_weights.pth"
        >>> predictor = DefaultPredictor(cfg)
        >>> result = predictor(image)

        >>> detections = sv.Detections.from_detectron2(result)
        ```
    """
    return cls(
        xyxy=detectron2_results["instances"].pred_boxes.tensor.cpu().numpy(),
        confidence=detectron2_results["instances"].scores.cpu().numpy(),
        class_id=detectron2_results["instances"]
        .pred_classes.cpu()
        .numpy()
        .astype(int),
    )

`from_roboflow(roboflow_result, class_list)` `classmethod` ¶

Create a Detections object from the Roboflow API inference result.

Parameters:

Name	Type	Description	Default
`roboflow_result`	`dict`	The result from the Roboflow API containing predictions.	required
`class_list`	`List[str]`	A list of class names corresponding to the class IDs in the API result.	required

Returns:

Type	Description
`Detections`	A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

Example

>>> import supervision as sv

>>> roboflow_result = {
...     "predictions": [
...         {
...             "x": 0.5,
...             "y": 0.5,
...             "width": 0.2,
...             "height": 0.3,
...             "class": "person",
...             "confidence": 0.9
...         },
...         # ... more predictions ...
...     ]
... }
>>> class_list = ["person", "car", "dog"]

>>> detections = sv.Detections.from_roboflow(roboflow_result, class_list)

Source code in supervision/detection/core.py

@classmethod
def from_roboflow(cls, roboflow_result: dict, class_list: List[str]) -> Detections:
    """
    Create a Detections object from the [Roboflow](https://roboflow.com/) API inference result.

    Args:
        roboflow_result (dict): The result from the Roboflow API containing predictions.
        class_list (List[str]): A list of class names corresponding to the class IDs in the API result.

    Returns:
        (Detections): A Detections object containing the bounding boxes, class IDs, and confidences of the predictions.

    Example:
        ```python
        >>> import supervision as sv

        >>> roboflow_result = {
        ...     "predictions": [
        ...         {
        ...             "x": 0.5,
        ...             "y": 0.5,
        ...             "width": 0.2,
        ...             "height": 0.3,
        ...             "class": "person",
        ...             "confidence": 0.9
        ...         },
        ...         # ... more predictions ...
        ...     ]
        ... }
        >>> class_list = ["person", "car", "dog"]

        >>> detections = sv.Detections.from_roboflow(roboflow_result, class_list)
        ```
    """
    xyxy = []
    confidence = []
    class_id = []

    for prediction in roboflow_result["predictions"]:
        x = prediction["x"]
        y = prediction["y"]
        width = prediction["width"]
        height = prediction["height"]
        x_min = x - width / 2
        y_min = y - height / 2
        x_max = x_min + width
        y_max = y_min + height
        xyxy.append([x_min, y_min, x_max, y_max])
        class_id.append(class_list.index(prediction["class"]))
        confidence.append(prediction["confidence"])

    return Detections(
        xyxy=np.array(xyxy),
        confidence=np.array(confidence),
        class_id=np.array(class_id).astype(int),
    )

`from_sam(sam_result)` `classmethod` ¶

Creates a Detections instance from Segment Anything Model inference result.

Parameters:

Name	Type	Description	Default
`sam_result`	`List[dict]`	The output Results instance from SAM	required

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object.

Example

>>> import supervision as sv
>>> from segment_anything import sam_model_registry, SamAutomaticMaskGenerator

>>> sam = sam_model_registry[MODEL_TYPE](checkpoint=CHECKPOINT_PATH).to(device=DEVICE)
>>> mask_generator = SamAutomaticMaskGenerator(sam)
>>> sam_result = mask_generator.generate(IMAGE)
>>> detections = sv.Detections.from_sam(sam_result=sam_result)

Source code in supervision/detection/core.py

@classmethod
def from_sam(cls, sam_result: List[dict]) -> Detections:
    """
    Creates a Detections instance from [Segment Anything Model](https://github.com/facebookresearch/segment-anything) inference result.

    Args:
        sam_result (List[dict]): The output Results instance from SAM

    Returns:
        Detections: A new Detections object.

    Example:
        ```python
        >>> import supervision as sv
        >>> from segment_anything import sam_model_registry, SamAutomaticMaskGenerator

        >>> sam = sam_model_registry[MODEL_TYPE](checkpoint=CHECKPOINT_PATH).to(device=DEVICE)
        >>> mask_generator = SamAutomaticMaskGenerator(sam)
        >>> sam_result = mask_generator.generate(IMAGE)
        >>> detections = sv.Detections.from_sam(sam_result=sam_result)
        ```
    """
    sorted_generated_masks = sorted(
        sam_result, key=lambda x: x["area"], reverse=True
    )

    xywh = np.array([mask["bbox"] for mask in sorted_generated_masks])
    mask = np.array([mask["segmentation"] for mask in sorted_generated_masks])

    return Detections(xyxy=xywh_to_xyxy(boxes_xywh=xywh), mask=mask)

`from_transformers(transformers_results)` `classmethod` ¶

Creates a Detections instance from object detection transformer inference result.

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object.

Source code in supervision/detection/core.py

@classmethod
def from_transformers(cls, transformers_results: dict) -> Detections:
    """
    Creates a Detections instance from object detection [transformer](https://github.com/huggingface/transformers) inference result.

    Returns:
        Detections: A new Detections object.
    """
    return cls(
        xyxy=transformers_results["boxes"].cpu().numpy(),
        confidence=transformers_results["scores"].cpu().numpy(),
        class_id=transformers_results["labels"].cpu().numpy().astype(int),
    )

`from_yolo_nas(yolo_nas_results)` `classmethod` ¶

Creates a Detections instance from a YOLO-NAS inference result.

Parameters:

Name	Type	Description	Default
`yolo_nas_results`	`ImageDetectionPrediction`	The output Results instance from YOLO-NAS	required

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object.

Example

>>> import cv2
>>> from super_gradients.training import models
>>> import supervision as sv

>>> image = cv2.imread(SOURCE_IMAGE_PATH)
>>> model = models.get('yolo_nas_l', pretrained_weights="coco")
>>> result = list(model.predict(image, conf=0.35))[0]
>>> detections = sv.Detections.from_yolo_nas(result)

Source code in supervision/detection/core.py

@classmethod
def from_yolo_nas(cls, yolo_nas_results) -> Detections:
    """
    Creates a Detections instance from a [YOLO-NAS](https://github.com/Deci-AI/super-gradients/blob/master/YOLONAS.md) inference result.

    Args:
        yolo_nas_results (super_gradients.training.models.prediction_results.ImageDetectionPrediction): The output Results instance from YOLO-NAS

    Returns:
        Detections: A new Detections object.

    Example:
        ```python
        >>> import cv2
        >>> from super_gradients.training import models
        >>> import supervision as sv

        >>> image = cv2.imread(SOURCE_IMAGE_PATH)
        >>> model = models.get('yolo_nas_l', pretrained_weights="coco")
        >>> result = list(model.predict(image, conf=0.35))[0]
        >>> detections = sv.Detections.from_yolo_nas(result)
        ```
    """
    return cls(
        xyxy=yolo_nas_results.prediction.bboxes_xyxy,
        confidence=yolo_nas_results.prediction.confidence,
        class_id=yolo_nas_results.prediction.labels.astype(int),
    )

`from_yolov5(yolov5_results)` `classmethod` ¶

Creates a Detections instance from a YOLOv5 inference result.

Parameters:

Name	Type	Description	Default
`yolov5_results`	`Detections`	The output Detections instance from YOLOv5	required

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object.

Example

>>> import cv2
>>> import torch
>>> import supervision as sv

>>> image = cv2.imread(SOURCE_IMAGE_PATH)
>>> model = torch.hub.load('ultralytics/yolov5', 'yolov5s')
>>> result = model(image)
>>> detections = sv.Detections.from_yolov5(result)

Source code in supervision/detection/core.py

@classmethod
def from_yolov5(cls, yolov5_results) -> Detections:
    """
    Creates a Detections instance from a [YOLOv5](https://github.com/ultralytics/yolov5) inference result.

    Args:
        yolov5_results (yolov5.models.common.Detections): The output Detections instance from YOLOv5

    Returns:
        Detections: A new Detections object.

    Example:
        ```python
        >>> import cv2
        >>> import torch
        >>> import supervision as sv

        >>> image = cv2.imread(SOURCE_IMAGE_PATH)
        >>> model = torch.hub.load('ultralytics/yolov5', 'yolov5s')
        >>> result = model(image)
        >>> detections = sv.Detections.from_yolov5(result)
        ```
    """
    yolov5_detections_predictions = yolov5_results.pred[0].cpu().cpu().numpy()
    return cls(
        xyxy=yolov5_detections_predictions[:, :4],
        confidence=yolov5_detections_predictions[:, 4],
        class_id=yolov5_detections_predictions[:, 5].astype(int),
    )

`from_yolov8(yolov8_results)` `classmethod` ¶

Creates a Detections instance from a YOLOv8 inference result.

Parameters:

Name	Type	Description	Default
`yolov8_results`	`Results`	The output Results instance from YOLOv8	required

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object.

Example

>>> import cv2
>>> from ultralytics import YOLO
>>> import supervision as sv

>>> image = cv2.imread(SOURCE_IMAGE_PATH)
>>> model = YOLO('yolov8s.pt')
>>> result = model(image)[0]
>>> detections = sv.Detections.from_yolov8(result)

Source code in supervision/detection/core.py

@classmethod
def from_yolov8(cls, yolov8_results) -> Detections:
    """
    Creates a Detections instance from a [YOLOv8](https://github.com/ultralytics/ultralytics) inference result.

    Args:
        yolov8_results (ultralytics.yolo.engine.results.Results): The output Results instance from YOLOv8

    Returns:
        Detections: A new Detections object.

    Example:
        ```python
        >>> import cv2
        >>> from ultralytics import YOLO
        >>> import supervision as sv

        >>> image = cv2.imread(SOURCE_IMAGE_PATH)
        >>> model = YOLO('yolov8s.pt')
        >>> result = model(image)[0]
        >>> detections = sv.Detections.from_yolov8(result)
        ```
    """
    return cls(
        xyxy=yolov8_results.boxes.xyxy.cpu().numpy(),
        confidence=yolov8_results.boxes.conf.cpu().numpy(),
        class_id=yolov8_results.boxes.cls.cpu().numpy().astype(int),
        mask=extract_yolov8_masks(yolov8_results),
    )

`get_anchor_coordinates(anchor)` ¶

Returns the bounding box coordinates for a specific anchor.

Parameters:

Name	Type	Description	Default
`anchor`	`Position`	Position of bounding box anchor for which to return the coordinates.	required

Returns:

Type	Description
`ndarray`	np.ndarray: An array of shape `(n, 2)` containing the bounding box anchor coordinates in format `[x, y]`.

Source code in supervision/detection/core.py

def get_anchor_coordinates(self, anchor: Position) -> np.ndarray:
    """
    Returns the bounding box coordinates for a specific anchor.

    Args:
        anchor (Position): Position of bounding box anchor for which to return the coordinates.

    Returns:
        np.ndarray: An array of shape `(n, 2)` containing the bounding box anchor coordinates in format `[x, y]`.
    """
    if anchor == Position.CENTER:
        return np.array(
            [
                (self.xyxy[:, 0] + self.xyxy[:, 2]) / 2,
                (self.xyxy[:, 1] + self.xyxy[:, 3]) / 2,
            ]
        ).transpose()
    elif anchor == Position.BOTTOM_CENTER:
        return np.array(
            [(self.xyxy[:, 0] + self.xyxy[:, 2]) / 2, self.xyxy[:, 3]]
        ).transpose()

    raise ValueError(f"{anchor} is not supported.")

`merge(detections_list)` `classmethod` ¶

Merge a list of Detections objects into a single Detections object.

This method takes a list of Detections objects and combines their respective fields (xyxy, mask, confidence, class_id, and tracker_id) into a single Detections object. If all elements in a field are not None, the corresponding field will be stacked. Otherwise, the field will be set to None.

Parameters:

Name	Type	Description	Default
`detections_list`	`List[Detections]`	A list of Detections objects to merge.	required

Returns:

Type	Description
`Detections`	A single Detections object containing the merged data from the input list.

Example

>>> from supervision import Detections

>>> detections_1 = Detections(...)
>>> detections_2 = Detections(...)

>>> merged_detections = Detections.merge([detections_1, detections_2])

Source code in supervision/detection/core.py

@classmethod
def merge(cls, detections_list: List[Detections]) -> Detections:
    """
    Merge a list of Detections objects into a single Detections object.

    This method takes a list of Detections objects and combines their respective fields (`xyxy`, `mask`,
    `confidence`, `class_id`, and `tracker_id`) into a single Detections object. If all elements in a field are not
    `None`, the corresponding field will be stacked. Otherwise, the field will be set to `None`.

    Args:
        detections_list (List[Detections]): A list of Detections objects to merge.

    Returns:
        (Detections): A single Detections object containing the merged data from the input list.

    Example:
        ```python
        >>> from supervision import Detections

        >>> detections_1 = Detections(...)
        >>> detections_2 = Detections(...)

        >>> merged_detections = Detections.merge([detections_1, detections_2])
        ```
    """
    if len(detections_list) == 0:
        return Detections.empty()

    detections_tuples_list = [astuple(detection) for detection in detections_list]
    xyxy, mask, confidence, class_id, tracker_id = [
        list(field) for field in zip(*detections_tuples_list)
    ]

    all_not_none = lambda l: all(x is not None for x in l)

    xyxy = np.vstack(xyxy)
    mask = np.vstack(mask) if all_not_none(mask) else None
    confidence = np.hstack(confidence) if all_not_none(confidence) else None
    class_id = np.hstack(class_id) if all_not_none(class_id) else None
    tracker_id = np.hstack(tracker_id) if all_not_none(tracker_id) else None

    return cls(
        xyxy=xyxy,
        mask=mask,
        confidence=confidence,
        class_id=class_id,
        tracker_id=tracker_id,
    )

`with_nms(threshold=0.5, class_agnostic=False)` ¶

Perform non-maximum suppression on the current set of object detections.

Parameters:

Name	Type	Description	Default
`threshold`	`float`	The intersection-over-union threshold to use for non-maximum suppression. Defaults to 0.5.	`0.5`
`class_agnostic`	`bool`	Whether to perform class-agnostic non-maximum suppression. If True, the class_id of each detection will be ignored. Defaults to False.	`False`

Returns:

Name	Type	Description
`Detections`	`Detections`	A new Detections object containing the subset of detections after non-maximum suppression.

Raises:

Type	Description
`AssertionError`	If `confidence` is None and class_agnostic is False. If `class_id` is None and class_agnostic is False.

Source code in supervision/detection/core.py

def with_nms(
    self, threshold: float = 0.5, class_agnostic: bool = False
) -> Detections:
    """
    Perform non-maximum suppression on the current set of object detections.

    Args:
        threshold (float, optional): The intersection-over-union threshold to use for non-maximum suppression. Defaults to 0.5.
        class_agnostic (bool, optional): Whether to perform class-agnostic non-maximum suppression. If True, the class_id of each detection will be ignored. Defaults to False.

    Returns:
        Detections: A new Detections object containing the subset of detections after non-maximum suppression.

    Raises:
        AssertionError: If `confidence` is None and class_agnostic is False. If `class_id` is None and class_agnostic is False.
    """
    if len(self) == 0:
        return self

    assert (
        self.confidence is not None
    ), f"Detections confidence must be given for NMS to be executed."

    if class_agnostic:
        predictions = np.hstack((self.xyxy, self.confidence.reshape(-1, 1)))
        indices = non_max_suppression(
            predictions=predictions, iou_threshold=threshold
        )
        return self[indices]

    assert self.class_id is not None, (
        f"Detections class_id must be given for NMS to be executed. If you intended to perform class agnostic "
        f"NMS set class_agnostic=True."
    )

    predictions = np.hstack(
        (self.xyxy, self.confidence.reshape(-1, 1), self.class_id.reshape(-1, 1))
    )
    indices = non_max_suppression(predictions=predictions, iou_threshold=threshold)
    return self[indices]

Core

Detections¶

area: np.ndarray property ¶

box_area: np.ndarray property ¶

__getitem__(index) ¶

__iter__() ¶

__len__() ¶

empty() classmethod ¶

from_detectron2(detectron2_results) classmethod ¶

from_roboflow(roboflow_result, class_list) classmethod ¶

from_sam(sam_result) classmethod ¶

from_transformers(transformers_results) classmethod ¶

from_yolo_nas(yolo_nas_results) classmethod ¶

from_yolov5(yolov5_results) classmethod ¶

from_yolov8(yolov8_results) classmethod ¶

get_anchor_coordinates(anchor) ¶

merge(detections_list) classmethod ¶

with_nms(threshold=0.5, class_agnostic=False) ¶

`area: np.ndarray` `property` ¶

`box_area: np.ndarray` `property` ¶

`getitem(index)` ¶

`iter()` ¶

`len()` ¶

`empty()` `classmethod` ¶

`from_detectron2(detectron2_results)` `classmethod` ¶

`from_roboflow(roboflow_result, class_list)` `classmethod` ¶

`from_sam(sam_result)` `classmethod` ¶

`from_transformers(transformers_results)` `classmethod` ¶

`from_yolo_nas(yolo_nas_results)` `classmethod` ¶

`from_yolov5(yolov5_results)` `classmethod` ¶

`from_yolov8(yolov8_results)` `classmethod` ¶

`get_anchor_coordinates(anchor)` ¶

`merge(detections_list)` `classmethod` ¶

`with_nms(threshold=0.5, class_agnostic=False)` ¶