Source code for n_fold_edge.marker_locator

"""Locate a marker of given order in image."""

import math
import traceback
from collections.abc import Sequence

import cv2
import numpy as np

from n_fold_edge.marker_pose import MarkerPose



[docs]
class MarkerLocator:
    """
    Locate a marker in an image.

    Parameters
    ----------
    order : int
        The order type of the marker to locate.
    kernel_size : int
        Kernel size to use for detecting the marker.
    scale_factor : float
        Scale factor to use for detecting the marker.
    """

    def __init__(self, order: int, kernel_size: int = 55, scale_factor: float = 1000) -> None:
        self.order = order
        self.kernel_size = kernel_size
        (kernel_real, kernel_imag) = self._generate_symmetry_detector_kernel(order, kernel_size)
        self.mat_real = kernel_real / scale_factor
        self.mat_imag = kernel_imag / scale_factor
        self.frame_real: np.ndarray
        self.frame_imag: np.ndarray
        self.track_marker_with_missing_black_leg = True
        # Create kernel used to remove arm in quality-measure
        (kernel_remove_arm_real, kernel_remove_arm_imag) = self._generate_symmetry_detector_kernel(1, self.kernel_size)
        self.kernelComplex = np.array(kernel_real + 1j * kernel_imag, dtype=complex)
        self.KernelRemoveArmComplex = np.array(kernel_remove_arm_real + 1j * kernel_remove_arm_imag, dtype=complex)
        # Values used in quality-measure
        self.threshold = 0.4 * np.absolute(self.kernelComplex).max()
        self.y1 = int(math.floor(float(self.kernel_size) / 2))
        self.y2 = int(math.ceil(float(self.kernel_size) / 2))
        self.x1 = int(math.floor(float(self.kernel_size) / 2))
        self.x2 = int(math.ceil(float(self.kernel_size) / 2))

    @staticmethod
    def _generate_symmetry_detector_kernel(order: int, kernel_size: int) -> tuple[np.ndarray, np.ndarray]:
        value_range = np.linspace(-1, 1, kernel_size)
        temp1 = np.meshgrid(value_range, value_range)
        kernel = temp1[0] + 1j * temp1[1]
        magnitude = abs(kernel)
        kernel = np.power(kernel, order)
        kernel = kernel * np.exp(-8 * magnitude**2)
        return np.real(kernel), np.imag(kernel)

    def _refine_marker_location(self, marker_location: Sequence[int]) -> tuple[float, float]:
        try:
            delta = 1
            # Fit a parabola to the frame_sum_squared marker response
            # and then locate the top of the parabola.
            x = marker_location[1]
            y = marker_location[0]
            frame_sum_squared_cutout = self.frame_sum_squared[x - delta : x + delta + 1, y - delta : y + delta + 1]
            # Taking the square root of the frame_sum_squared improves the accuracy of the
            # refined marker position.
            frame_sum_squared_cutout = np.sqrt(frame_sum_squared_cutout)
            nx, ny = (1 + 2 * delta, 1 + 2 * delta)
            x = np.linspace(-delta, delta, nx)
            y = np.linspace(-delta, delta, ny)
            xv, yv = np.meshgrid(x, y)
            xv = xv.ravel()
            yv = yv.ravel()
            # a*xv^2 + b*xv + c*yv^2 + d*yv + e*xv*yv + f
            coefficients = np.concatenate([[xv**2], [xv], [yv**2], [yv], [xv * yv], [yv**0]], axis=0).transpose()
            values = frame_sum_squared_cutout.ravel().reshape(-1, 1)
            solution, _, _, _ = np.linalg.lstsq(coefficients, values, rcond=None)
            solution = solution.squeeze()
            dx_init = -solution[1] / (2 * solution[0])
            dy_init = -solution[3] / (2 * solution[2])
            dx = -(solution[1] + solution[4] * dy_init) / (2 * solution[0])
            dy = -(solution[3] + solution[4] * dx_init) / (2 * solution[2])
            return dx, dy
        except np.linalg.LinAlgError:
            # This error is triggered when the marker is detected close to an edge.
            # In that case the refine method bails out and returns two zeros.
            return 0, 0


[docs]
    def apply_convolution_with_complex_kernel(self, frame: np.ndarray) -> np.ndarray:
        """
        Get the response from applying the convolution of a complex kernel on an image.

        Parameters
        ----------
        frame : ndarray
            Image or frame of a marker.

        Returns
        -------
        response : ndarray
            Result of applying the convolution of a complex kernel.
        """
        assert len(frame.shape) == 2, "Input image is not a single channel image."
        self.frame_real = frame.copy()
        self.frame_imag = frame.copy()
        # Calculate convolution and determine response strength.
        self.frame_real = cv2.filter2D(self.frame_real, cv2.CV_32F, self.mat_real)
        self.frame_imag = cv2.filter2D(self.frame_imag, cv2.CV_32F, self.mat_imag)
        frame_real_squared = cv2.multiply(self.frame_real, self.frame_real, dtype=cv2.CV_32F)
        frame_imag_squared = cv2.multiply(self.frame_imag, self.frame_imag, dtype=cv2.CV_32F)
        self.frame_sum_squared = cv2.add(frame_real_squared, frame_imag_squared, dtype=cv2.CV_32F)
        return self.frame_sum_squared



[docs]
    def locate_marker(self, frame: np.ndarray) -> MarkerPose:
        """
        Locate the marker with in the frame.

        Parameters
        ----------
        frame : ndarray
            A frame or image with the marker to locate.
        """
        self.frame_sum_squared = self.apply_convolution_with_complex_kernel(frame)
        _, _, _, max_loc = cv2.minMaxLoc(self.frame_sum_squared)
        orientation = self._determine_marker_orientation(frame, max_loc)
        quality = self._determine_marker_quality(frame, max_loc, orientation)
        dx, dy = self._refine_marker_location(max_loc)
        marker_location = (max_loc[0] + dx, max_loc[1] + dy)
        return MarkerPose(marker_location[0], marker_location[1], orientation, quality, self.order)


    def _determine_marker_orientation(self, frame: np.ndarray, marker_location: Sequence[int]) -> float:
        (xm, ym) = marker_location
        real_value = self.frame_real[ym, xm]
        imag_value = self.frame_imag[ym, xm]
        orientation = (math.atan2(-real_value, imag_value) - math.pi / 2) / self.order
        max_value = 0
        max_orientation = orientation
        search_distance = self.kernel_size / 3
        for k in range(self.order):
            orient = orientation + 2 * k * math.pi / self.order
            xm2 = int(xm + search_distance * math.cos(orient))
            ym2 = int(ym + search_distance * math.sin(orient))
            try:
                intensity = frame[ym2, xm2]
                if intensity > max_value:
                    max_value = intensity
                    max_orientation = orient
            except IndexError:
                pass
            except Exception as e:
                traceback.print_exception(e)
                pass
        return self._limit_angle_to_range(max_orientation)

    @staticmethod
    def _limit_angle_to_range(angle: float) -> float:
        while angle < math.pi:
            angle += 2 * math.pi
        while angle > math.pi:
            angle -= 2 * math.pi
        return angle

    def _determine_marker_quality(self, frame: np.ndarray, marker_location: Sequence[int], orientation: float) -> float:
        (bright_regions, dark_regions) = self._generate_template_for_quality_estimator(orientation)
        try:
            frame_img = self._extract_window_around_maker_location(frame, marker_location)
            if frame_img.shape != bright_regions.shape or frame_img.shape != dark_regions.shape:
                return 0.0
            (bright_mean, bright_std) = cv2.meanStdDev(frame_img, mask=bright_regions)
            (dark_mean, dark_std) = cv2.meanStdDev(frame_img, mask=dark_regions)
            mean_difference = np.squeeze(bright_mean - dark_mean)
            normalized_mean_difference = np.squeeze(mean_difference / (0.5 * bright_std + 0.5 * dark_std))
            # Ugly hack for translating the normalized_mean_differences to the range [0, 1]
            temp_value_for_quality = 1 - 1 / (1 + math.exp(0.75 * (-7 + normalized_mean_difference)))
            return temp_value_for_quality
        except Exception as e:
            traceback.print_exception(e)
            return 0.0

    def _extract_window_around_maker_location(self, frame: np.ndarray, marker_location: Sequence[int]) -> np.ndarray:
        xm, ym = marker_location
        frame_tmp = np.array(frame[ym - self.y1 : ym + self.y2, xm - self.x1 : xm + self.x2])
        frame_img = frame_tmp.astype(np.uint8)
        return frame_img

    def _generate_template_for_quality_estimator(self, orientation: float) -> tuple[np.ndarray, np.ndarray]:
        phase = np.exp((self._limit_angle_to_range(-orientation)) * 1j)
        angle_threshold = 3.14 / (2 * self.order)
        t3 = np.angle(self.KernelRemoveArmComplex * phase) < angle_threshold
        t4 = np.angle(self.KernelRemoveArmComplex * phase) > -angle_threshold
        signed_mask = 1 - 2 * (t3 & t4)
        adjusted_kernel = self.kernelComplex * np.power(phase, self.order)
        if self.track_marker_with_missing_black_leg:
            adjusted_kernel *= signed_mask
        bright_regions = (adjusted_kernel.real < -self.threshold).astype(np.uint8)
        dark_regions = (adjusted_kernel.real > self.threshold).astype(np.uint8)
        return bright_regions, dark_regions