Source code for mil_vision_tools.shape_finder

#!/usr/bin/env python3
from __future__ import annotations

from typing import Any

import cv2
import numpy as np
from geometry_msgs.msg import Polygon
from image_geometry import PinholeCameraModel
from mil_ros_tools.msg_helpers import numpy_to_polygon, rosmsg_to_numpy

__author__ = "Kevin Allen"


class RectFinder:
    """
    Keeps a model of a rectangle in meters, providing utility functions
    to find 2D and 3D pose estimations of rectangles matching this model
    found in a computer vision program.

    Attributes:
        length (float): The measurement of the longer side of the rectangle, in meters.
        width (float): The measurement of the shorter side of the rectangle, in meters.
        model_3D (np.ndarray): The internal model of the three-dimensional rectangle:
            a 4x3 float array of corners centered on the origin with ``z = 0``.
        model_2D (np.ndarray): A 4x1x2 integer contour of the rectangle, scaled so that
            the longer side spans 10000 units. Used by :meth:`.verify_contour`
            and :meth:`.draw_model`.
    """

    def __init__(self, length: float = 1.0, width: float = 1.0):
        """
        Initializes the internal model of the rectangle. If width > length, the
        two will be reversed so that length is always the longer side.

        Args:
            length (float): The measurement of the longer side of the rectangle
                in meters.
            width (float): The measurement of the shorter side of the rectangle
                in meters.
        """
        # Ensure length >= width (np.sort is ascending, so width comes first)
        self.width, self.length = np.sort([length, width])
        half_length = self.length / 2.0
        half_width = self.width / 2.0
        # The builtin ``float``/``int`` dtypes are used instead of the
        # ``np.float``/``np.int`` aliases, which newer NumPy releases removed.
        self.model_3D = np.array(
            [
                [half_length, -half_width, 0],
                [half_length, half_width, 0],
                [-half_length, half_width, 0],
                [-half_length, -half_width, 0],
            ],
            dtype=float,
        )

        # Scale 2D model to maintain precision when converting to int
        scale = 10000 / self.length
        self.model_2D = np.array(
            [
                [[0, 0]],
                [[self.width * scale, 0]],
                [[self.width * scale, self.length * scale]],
                [[0, self.length * scale]],
            ],
            dtype=int,
        )

    @classmethod
    def from_polygon(cls, polygon: Polygon) -> RectFinder:
        """
        Creates a RectFinder from a ``geometry_msgs/Polygon`` message.

        The length of the class becomes the range of x/y (whichever larger). The width
        becomes the range of x/y (whichever shorter). If the polygon holds exactly
        one point, that point's x and y values are used directly as the two side
        measurements instead.

        Args:
            polygon (:class:`~geometry_msgs.msg._Polygon.Polygon`): The polygon to construct
                the class from.

        Raises:
            AssertionError: The polygon parameter is not an instance of :class:`~geometry_msgs.msg._Polygon.Polygon`.

        Returns:
            RectFinder: A new instance of the class.
        """
        assert isinstance(polygon, Polygon)
        # Column 0 is read as x and column 1 as y.
        arr = rosmsg_to_numpy(polygon.points)
        # If it contains just one point, treat the x/y as length/width
        if arr.shape[0] == 1:
            return cls(arr[0, 0], arr[0, 1])
        return cls(np.ptp(arr[:, 0]), np.ptp(arr[:, 1]))

    def to_polygon(self) -> Polygon:
        """
        Returns a ``geometry_msgs/Polygon`` instance representing the four corners
        of the rectangle where all ``z = 0``.

        Returns:
            Polygon: A constructed message.
        """
        return numpy_to_polygon(self.model_3D)

    @staticmethod
    def sort_corners(
        rect: np.ndarray,
        debug_image: np.ndarray | None = None,
    ) -> np.ndarray:
        """
        Given a contour of 4 points, returns the same 4 points sorted in a known way.
        Used so that indices of contour line up to that in model for cv2.solvePnp

        Args:
            rect (np.ndarray): An array representing the contour of 4 points, shaped
                either ``(4, 1, 2)`` or ``(4, 2)``.
            debug_image (Optional[np.ndarray]): If not None, an image onto which a
                circle and the text of the index are drawn at each corner.

        Returns:
            np.ndarray: The corners as a ``(4, 2)`` array in the order shown below.

        .. code-block::

            p[0] = Top left corner         0--1     1--------2
            p[1] = Top right corner        |  |  or |        |
            p[2] = Bottom right corner     |  |     0--------3
            p[3] = Bottom left corner      3--2
        """
        # Credit to David Soto for this implementation.
        # Work with both (n, 1, 2) and (n, 2) shaped contour representations
        points = np.reshape(rect, (-1, 2))
        M = cv2.moments(points.reshape(-1, 1, 2))
        if M["m00"] != 0:
            centroid = np.array(
                (int(M["m10"] / M["m00"]), int(M["m01"] / M["m00"])),
            )
        else:
            # Zero-area contour: the moment centroid is undefined (it would
            # divide by zero), so fall back to the mean of the points.
            centroid = points.mean(axis=0).astype(int)
        # Sort by arctan formed by vector from centroid to each point
        vectors = points - centroid
        order = np.argsort(np.arctan2(vectors[:, 1], vectors[:, 0]))
        points = points[order]
        # If rect is horizontal, correct indices as noted above
        if np.linalg.norm(points[0] - points[1]) > np.linalg.norm(
            points[0] - points[3],
        ):
            points = points[[3, 0, 1, 2]]
        # Print indices onto image if debug_image is given
        if debug_image is not None:
            for i, pixel in enumerate(points):
                center = (int(pixel[0]), int(pixel[1]))
                cv2.circle(debug_image, center, 5, (0, 255, 0), -1)
                cv2.putText(
                    debug_image,
                    str(i),
                    center,
                    cv2.FONT_HERSHEY_SCRIPT_COMPLEX,
                    1,
                    (0, 0, 255),
                )
        return points

    def verify_contour(self, contour: np.ndarray) -> Any:
        """
        Returns a numerical comparison between a contour and the perfect
        model of the rectangle. A perfectly matched contour returns 0.0.

        Useful for filtering contours.

        Args:
            contour (np.ndarray): The contour to compare against the model.

        Returns:
            Any: The value returned by ``cv2.matchShapes`` for the contour and
            the internal 2D model.
        """
        # CONTOURS_MATCH_I3 is the named form of the comparison method ``3``.
        return cv2.matchShapes(contour, self.model_2D, cv2.CONTOURS_MATCH_I3, 0.0)

    def get_corners(
        self,
        contour: np.ndarray,
        debug_image: np.ndarray | None = None,
        epsilon_range: tuple[float, float] = (0.01, 0.1),
        epsilon_step: float = 0.01,
    ) -> np.ndarray | None:
        """
        Attempts to find the 4 corners of a contour representing a quadrilateral.

        If the corners are found, it returns these 4 points sorted as described
        in :meth:`.sort_corners`. These corners can be used for :meth:`.get_pose_2D`
        and :meth:`.get_pose_3D`.

        If a 4 sided polygon cannot be approximated, returns ``None``.

        Args:
            contour (np.ndarray): The contour of the image.
            debug_image (Optional[np.ndarray]): If not ``None``, will draw corners with
                text for indexes onto image.
            epsilon_range (Tuple[float, float]): Tuple of two epsilon values (factor
                of contour arclength) to try for polygon approx.
            epsilon_step (float): How much to increment epsilon each time while
                iterating through epsilon_range. Must be positive.

        Raises:
            ValueError: ``epsilon_step`` is not positive.

        Returns:
            Optional[np.ndarray]: The array, if it can be approximated.
        """
        # A non-positive step would never leave the range, so the search
        # below could loop forever whenever no quadrilateral is found.
        if epsilon_step <= 0:
            raise ValueError("epsilon_step must be positive")
        # Credit David Soto for idea to iterate through multiple epsilon values
        arclength = cv2.arcLength(contour, True)
        epsilon = epsilon_range[0]
        while epsilon <= epsilon_range[1]:
            polygon = cv2.approxPolyDP(contour, epsilon * arclength, True)
            if len(polygon) == 4:
                return self.sort_corners(polygon, debug_image=debug_image)
            epsilon += epsilon_step
        return None

    def get_pose_3D(
        self,
        corners: np.ndarray,
        intrinsics: np.ndarray | None = None,
        dist_coeffs: np.ndarray | None = None,
        cam: PinholeCameraModel | None = None,
        rectified: bool = False,
    ) -> tuple[Any, Any]:
        """
        Uses the model of the object, the corresponding pixels in the image, and camera
        intrinsics to estimate a 3D pose of the object.

        Either ``cam`` and ``rectified`` must be provided, or ``intrinsics`` and ``dist_coeffs``.
        When ``cam`` is given it takes precedence over ``intrinsics`` and ``dist_coeffs``.

        Args:
            corners (np.ndarray): 4x2 numpy array from :meth:`.get_corners` representing
                the 4 sorted corners in the image.
            intrinsics (np.ndarray): Camera intrinsic matrix.
            dist_coeffs (np.ndarray): Camera distortion coefficients.
            cam (Optional[PinholeCameraModel]): The camera model.
            rectified (bool): If ``cam`` is set, set True if corners were found in an
                already rectified image (image_rect_color topic).

        Raises:
            AssertionError: Neither ``cam`` nor both of ``intrinsics`` and
                ``dist_coeffs`` were provided.

        Returns:
            Tuple[Any, Any]: Represents the translation and rotation vector between
            the camera and the object in meters/radians. Use cv2.Rodrigues to convert
            ``rvec`` to a 3x3 rotation matrix.
        """
        corners = np.array(corners, dtype=float)
        # Use camera intrinsics and knowledge of marker's real dimensions to
        # get a pose estimate in camera frame
        if cam is not None:
            intrinsics = cam.intrinsicMatrix()
            # A rectified image is treated as having no remaining distortion.
            dist_coeffs = np.zeros((5, 1)) if rectified else cam.distortionCoeffs()
        assert intrinsics is not None, "intrinsics or cam must be provided"
        assert dist_coeffs is not None, "dist_coeffs or cam must be provided"
        _, rvec, tvec = cv2.solvePnP(self.model_3D, corners, intrinsics, dist_coeffs)
        return (tvec, rvec)

    def get_pose_2D(self, corners: np.ndarray) -> tuple[Any, Any]:
        """
        Finds the 2D center of the rectangle and a unit direction vector along the length
        of the rectangle in pixels.

        Args:
            corners (np.ndarray): 4x2 numpy array from :meth:`.get_corners` representing
                the 4 sorted corners in the image.

        Returns:
            Tuple[Any, Any]: A tuple representing ``(center, vector)``. ``vector``
            points from the midpoint of corners 2 and 3 towards the midpoint of
            corners 0 and 1.
        """
        corners = np.asarray(corners, dtype=float)
        top_center = (corners[1] + corners[0]) / 2.0
        bot_center = (corners[2] + corners[3]) / 2.0
        axis = top_center - bot_center
        center = bot_center + axis / 2.0
        vector = axis / np.linalg.norm(axis)
        return (center, vector)

    def draw_model(
        self,
        size: tuple[int, int] = (500, 500),
        border: int = 25,
    ) -> np.ndarray:
        """
        Returns a 1 channel image displaying the internal model of the rectangle.
        Useful for visually checking that your model is reasonable. Also useful
        to see what orientation of a contour will be considered 0 rotation in :meth:`.get_pose_3D`.

        Args:
            size (Tuple[int, int]): A 2 element tuple giving the resolution of the
                drawing area. The model is scaled so its largest coordinate
                equals the smaller of the two values.
            border (int): Size of the border, in pixels, around the model
                contour in the returned image.

        Returns:
            np.ndarray: A one channel ``uint8`` image whose array shape is ``size``
            plus ``2 * border`` in each dimension, with the internal model drawn
            in white on a black background.
        """
        size = np.array(size)
        scale = float(min(size)) / np.max(self.model_2D)
        # Shift the scaled model by the border so the outline is not clipped.
        model = np.array(border + (scale * self.model_2D), dtype=int)
        img = np.zeros(2 * border + size, dtype=np.uint8)
        cv2.drawContours(img, [model], 0, 255, 3)
        return img


class EllipseFinder(RectFinder):
    """
    Class to test contours in images for being close to an ellipse
    matching a given model. Uses RectFinder on well matched
    contours to get 3D pose estimates.

    Can be used just as RectFinder is used, but contours passed to verify_contour
    will be evaluated based on their similarity to an ellipse, not a rectangle.
    The get_corners function will return the corners of the least area rotated
    rectangle around the ellipse contour, so 3D pose estimation will still work.
    """

    def __init__(self, length: float = 1.0, width: float = 1.0):
        """
        Create internal model for an ellipse.

        Args:
            length (float): The measurement of the longer axis of the ellipse.
            width (float): The measurement of the shorter axis of the ellipse.
        """
        super().__init__(length, width)

        # Correct 2D model to be an oval so that verify_contour works
        scale = 1000.0 / self.length
        half_length = self.length * 0.5 * scale
        half_width = self.width * 0.5 * scale
        # Approximate an ellipse with 50 points, so that verify_contour is
        # still reasonably fast
        num_points = 50
        theta = np.linspace(0.0, 2.0 * np.pi, num=num_points)
        # The builtin ``int`` dtype replaces the ``np.int`` alias, which newer
        # NumPy releases removed. Assigning floats into the integer array
        # truncates them, as the per-element assignment did.
        self.model_2D = np.zeros((num_points, 1, 2), dtype=int)
        self.model_2D[:, 0, 0] = half_length + half_length * np.cos(theta)
        self.model_2D[:, 0, 1] = half_width + half_width * np.sin(theta)

    def get_corners(
        self,
        contour,
        debug_image=None,
        epsilon_range=(0.01, 0.1),
        epsilon_step=0.01,
    ):
        """
        Override get corner function for Ellipses to approximate an ellipse
        instead of a four sided polygon around the contour.

        Args:
            contour (np.ndarray): The contour to fit an ellipse to.
            debug_image (Optional[np.ndarray]): If not ``None``, will draw corners
                with text for indexes onto image.
            epsilon_range (Tuple[float, float]): Unused; accepted only so this
                override can be called with the same arguments as
                ``RectFinder.get_corners``.
            epsilon_step (float): Unused; accepted for the same reason as
                ``epsilon_range``.

        Returns:
            Optional[np.ndarray]: The sorted corners of the rotated bounding box
            of the fitted ellipse, or ``None`` if the contour has fewer than 5
            points.
        """
        # cv2.fitEllipse needs at least 5 points; report "not found" the same
        # way the rectangle version does instead of raising a cv2 error.
        if len(contour) < 5:
            return None
        ellipse = cv2.fitEllipse(contour)
        points = np.array(cv2.boxPoints(ellipse), dtype=np.int32).reshape(4, 1, 2)
        return self.sort_corners(points, debug_image=debug_image)


class CircleFinder(EllipseFinder):
    """
    Convenience finder for circles, modelled as an ellipse whose length and
    width are equal. See EllipseFinder for usage.

    NOTE(review): ``radius`` is forwarded unchanged as both the length and the
    width of the ellipse model, so the modelled circle's full extent equals
    ``radius`` -- confirm whether a diameter was intended.
    """

    def __init__(self, radius, _=None):
        # The second positional argument is accepted and discarded; presumably
        # so a circle can be constructed with the same two positional
        # arguments as the other finders -- verify against callers.
        super().__init__(length=radius, width=radius)