src/eoh.py

"""
EOH (Edge Oriented Histogram).

Implementation by: Cristiano Fraga G. Nunes <cfgnunes@gmail.com>

References:
[1] https://dx.doi.org/10.3390/s120912661
"""

import cv2
import numpy as np


class EOH():
    """EOH (Edge Oriented Histogram)."""

    # A constant to split the region into NxN subregions
    _N_SUBREGIONS = 4

    def __init__(self, window_size=80):
        """Class constructor.

        Args:
            window_size (int, optional):
                image window size around the keypoint, image patch.
        """
        self._window_size = window_size
        self._sobel_filters = self._get_sobel_filters()
        self._n_filters = self._sobel_filters.shape[0]

    def compute(self, image, keypoints):
        """Compute the descriptor for each keypoint.

        Args:
            image (numpy.ndarray): input image.
            keypoints (numpy.ndarray): keypoints.

        Returns:
            numpy.ndarray: descriptors for each keypoint.
                Shape: (n_keypoints, descriptor_size).
        """
        if not keypoints:
            return None

        descriptors = np.zeros(
            (len(keypoints), self.descriptor_size()), self.descriptor_type())

        # Compute the 'Maximum Index Map'
        mim = self._compute_maximum_index_map(image)

        # Compute the descriptor for each keypoint
        for i, keypoint in enumerate(keypoints):

            # Crop a window image around the keypoint
            mim_window = self._crop_window(
                mim, keypoint.pt, self._window_size)

            if mim_window is None:
                continue

            # Compute the histogram for all subregions
            histograms_window = self._compute_histogram_subregions(
                mim_window, self._n_filters, self._N_SUBREGIONS)

            # Concatenate all histograms in a single array
            histogram = np.concatenate(histograms_window)

            # Normalize the histogram to unit length
            norm = np.linalg.norm(histogram)
            if norm > 0:
                histogram = histogram / norm

            descriptors[i] = histogram

        return keypoints, descriptors

    def _compute_maximum_index_map(self, image):
        """Compute the 'Maximum Index Map' from a input image.

        Compute a 'Maximum Index Map': a matrix containing the index
        values of maximum filters responses. Each matrix value represents
        which filter had a maximum response for that pixel coordinate.

        Args:
            image (numpy.ndarray): the input image.

        Returns:
            numpy.ndarray: a matrix containing the index values of maximum
                filters responses (Maximum Index Map). Shape: (height, width).
        """
        # Apply the Sobel filters in the input image
        image_responses = self._apply_filters(image, self._sobel_filters)

        # Compute the 'Maximum Index Map' using argmax
        mim = np.argmax(image_responses, axis=0)

        # Apply the Canny edge detector
        image_edge = self._apply_canny(image)

        # Apply a mask in 'Maximum Index Map' using the image edge
        mim += (~(image_edge > 0) * self._n_filters)

        return mim

    def descriptor_size(self):
        """Get the size of the descriptor.

        Returns:
            int: the size of the descriptor.
        """
        return self._N_SUBREGIONS * self._N_SUBREGIONS * self._n_filters

    @staticmethod
    def descriptor_type():
        """Get the type of the descriptor.

        Returns:
            numpy.float32: the type of the descriptor.
        """
        return np.float32

    @staticmethod
    def _apply_filters(image, filters):
        """Apply kernel filters in the input image.

        Args:
            image (numpy.ndarray): input image.
            filters (numpy.ndarray): filters.
                Shape: (n_filters, filter_height, filter_width)

        Returns:
            numpy.ndarray: image responses to the filters.
                Shape: (n_filters, image_height, image_width).
        """
        n_filters = filters.shape[0]

        image_h, image_w = image.shape[:2]
        image_float = image.copy().astype(np.float32)

        image_responses = np.zeros((n_filters, image_h, image_w), np.float32)

        for i in range(n_filters):
            image_responses[i, :, :] = np.abs(
                cv2.filter2D(
                    src=image_float, ddepth=-1, kernel=filters[i, :, :]))

        return image_responses

    @staticmethod
    def _compute_histogram_subregions(image, n_bins, n_subregions):
        """Split an image into subregions and compute its histograms.

        Args:
            image (numpy.ndarray): input image.
            n_bins (int): number of bins in the histogram.
            n_subregions (int): number of NxN subregions.

        Returns:
            list of numpy.ndarray: list of histograms for each subregion.
        """
        histograms = []
        image_h, image_w = image.shape[:2]

        # Note: splitting the window into subregions keeps important spatial
        # information in the final descriptor.
        for i in range(n_subregions):
            for j in range(n_subregions):
                y_1 = i * int(image_h / n_subregions + 0.5)
                x_1 = j * int(image_w / n_subregions + 0.5)
                y_2 = (i + 1) * int(image_h / n_subregions + 0.5)
                x_2 = (j + 1) * int(image_w / n_subregions + 0.5)

                # For non-squared regions (if the splitting is not exact)
                if i == n_subregions - 1:
                    y_2 += image_h - y_2
                if j == n_subregions - 1:
                    x_2 += image_w - x_2

                # Crop a subregion from the 'Maximum Index Map'
                subregion = image[y_1:y_2, x_1:x_2]

                # Compute the histogram for the subregion
                histogram, _ = np.histogram(
                    subregion, bins=n_bins, range=[0, n_bins - 1])

                # Add the histogram of the subregion to the histogram list
                histograms.append(histogram)

        return histograms

    @staticmethod
    def _crop_window(image, center, size):
        """Crop a squared window from an image.

        Args:
            image (numpy.ndarray): input image.
            center (tuple of (int, int)): coord. of the center (x, y).
            size (int): the squared size of the window.

        Returns:
            numpy.ndarray: output window image.
        """
        image_h, image_w = image.shape[:2]
        center_x, center_y = int(center[0] + 0.5), int(center[1] + 0.5)
        half_size = size // 2
        size_even = 1 - size % 2

        # Check the boundaries
        y_1 = max(0, center_y - half_size)
        x_1 = max(0, center_x - half_size)
        y_2 = min(image_h, center_y + half_size + 1 - size_even)
        x_2 = min(image_w, center_x + half_size + 1 - size_even)

        # Ignore incomplete windows
        if y_2 - y_1 != size or x_2 - x_1 != size:
            return None

        return image[y_1:y_2, x_1:x_2]

    @staticmethod
    def _get_sobel_filters():
        """Return a filter bank with Sobel filters.

        Returns:
            numpy.ndarray: the Sobel filters. Shape: (n_filters, 3, 3).
        """
        filter_bank = [
            [[1, 2, 1], [0, 0, 0], [-1, -2, -1]],       # Horizontal filter
            [[-1, 0, 1], [-2, 0, 2], [-1, 0, 1]],       # Vertical filter
            [[2, 2, -1], [2, -1, -1], [-1, -1, -1]],    # 45 filter
            [[-1, 2, 2], [-1, -1, 2], [-1, -1, -1]],    # 135 filter
            [[-1, 0, 1], [0, 0, 0], [1, 0, -1]],        # No orientation filter
        ]

        return np.array(filter_bank)

    @staticmethod
    def _apply_canny(image):
        """Detect image edges with Canny algorithm.

        Args:
            image (numpy.ndarray): input image.

        Returns:
            numpy.ndarray: output image (edges).
        """
        # Apply a Gaussian filter to eliminate noise
        sig = 3
        image_blur = cv2.GaussianBlur(
            src=image, ksize=(sig * 3, sig * 3), sigmaX=sig, sigmaY=sig)

        # Find automatic good threshold values for Canny edge detector
        otsu, _ = cv2.threshold(
            src=image_blur, thresh=0, maxval=255, type=cv2.THRESH_OTSU)

        threshold = otsu * 0.5
        image_edge = cv2.Canny(image_blur, 0.5 * threshold, threshold)

        return image_edge