Source code for darsia.corrections.shape.translation

"""Module defining estimator for translation between ROIs and corresponding correction.

"""

from pathlib import Path
from typing import Optional, Union

import cv2
import matplotlib.pyplot as plt
import numpy as np

import darsia
from darsia.utils.features import FeatureDetection



[docs]
class TranslationEstimator:
    """Estimator of translation to align images based on feature detection.

    Estimation is performed by restriction to ROIs.

    """

    def __init__(self, max_features: int = 200, tol: float = 0.05, keep_percent=0.1):
        """Setup of user-defined tuning parameters.

        Args:
            max_features (int): feature detection parameter
            tol (float): tolerance used to detect whether matching transformation is a
                translation

        """
        self._max_features = max_features
        self._keep_percent = keep_percent
        self._tol = tol


[docs]
    def find_effective_translation(
        self,
        img_src: np.ndarray,
        img_dst: np.ndarray,
        roi_src: Optional[tuple] = None,
        roi_dst: Optional[tuple] = None,
        mask_src: Optional[np.ndarray] = None,
        mask_dst: Optional[np.ndarray] = None,
        plot_matches: bool = False,
    ) -> tuple:
        """Find translation to align two images through feature matching.

        All lengths are measured in number of pixels.

        Args:
            img_src (np.ndarray): source image
            img_dst (np.ndarray): destination image
            roi_src (tuple of slices): region of interested associated to the source image
            roi_dst (tuple of slices): region of interested associated to the destination image
            mask_src (np.ndarray, optional): boolean mask detecting considered pixels in
                the analysis; if None, all pixels are considered.
            mask_dst (np.ndarray, optional): boolean mask detecting considered pixels in
                the analysis; if None, all pixels are considered.
            plot_matches (bool): flag controlling whether the matching features are plotted;
                useful for debugging; default value is False

        Returns:
            np.ndarray: transformation matrix operating on pixel coordinates using reverse
                matrix indexing
            bool: flag indicating whether the procedure was successful

        """
        # Make several attempts to find a matching transformation.
        # First attempt to match both images, using a homography.
        # Finding a homography is the preferred approach, as it
        # allows for slightly more robustness control as transformation
        # models with less DOFs; a homography has 8 DOFs. Robustness is
        # later checked by comparing the linear contribution with the
        # identity matrix.
        # If the first attempt was not successful, try a second attempt.
        # Here, not a homography will be set up, but a similarity transform, i.e.,
        # an affine map describing scaling, rotation, and translation. This boils
        # down to 4 DOFs. Thus, the robustness comparison is easier to trick
        # compared to the first case.
        for transformation_type in ["homography", "partial_affine"]:
            transformation, _, matches = self._find_matching_transformation(
                img_src,
                img_dst,
                roi_src,
                roi_dst,
                mask_src,
                mask_dst,
                transformation_type=transformation_type,
                keep_percent=self._keep_percent,
                return_matches=True,
                plot_matches=plot_matches,
            )

            # Check whether the transformation is close to a translation and extract the
            # effective translation (as affine map) as average translation between the
            # matches.
            if self._isclose_translation(transformation):
                (translation, intact_translation) = self._find_translation(matches)
            else:
                translation = None
                intact_translation = False

            # Accept resulting transformation if it can be casted as translation
            if intact_translation:
                break

        return translation, intact_translation



[docs]
    def match_roi(
        self,
        img_src: Union[np.ndarray, darsia.Image],
        img_dst: Union[np.ndarray, darsia.Image],
        roi_src: Optional[tuple] = None,
        roi_dst: Optional[tuple] = None,
        plot_matches: bool = False,
    ) -> np.ndarray:
        """Align two images through feature matching in provided ROIs.

        Args:
            img_src (np.ndarray or darsia.Image): source image
            img_dst (np.ndarray or darsia.Image): destination image
            roi_src (tuple of slices): region of interested associated to the source image
            roi_dst (tuple of slices): region of interested associated to the destination image
                translation
            plot_matches (bool): flag controlling whether the matching features are plotted;
                useful for debugging; default value is False

        Returns:
            np.ndarray, optional: aligned source image, if input of type array

        """
        # Determine effective translation
        if isinstance(img_src, np.ndarray) and isinstance(img_dst, np.ndarray):
            return self._match_roi_arrays(
                img_src, img_dst, roi_src, roi_dst, plot_matches
            )
        elif isinstance(img_src, darsia.Image) and isinstance(img_dst, darsia.Image):
            return self._match_roi_images(
                img_src, img_dst, roi_src, roi_dst, plot_matches
            )
        else:
            raise ValueError("Provide images either as numpy arrays or darsia Images.")


    def _match_roi_arrays(
        self,
        img_src: np.ndarray,
        img_dst: np.ndarray,
        roi_src: Optional[tuple],
        roi_dst: Optional[tuple],
        plot_matches: bool = False,
    ) -> np.ndarray:
        """Align two images through feature matching in provided ROIs.

        Args:
            img_src (np.ndarray): source image
            img_dst (np.ndarray): destination image
            roi_src (tuple of slices): region of interested associated to the source image
            roi_dst (tuple of slices): region of interested associated to the destination image
                translation
            plot_matches (bool): flag controlling whether the matching features are plotted;
                useful for debugging; default value is False

        Returns:
            np.ndarray: aligned source image

        """
        # Determine effective translation
        translation, intact_translation = self.find_effective_translation(
            img_src, img_dst, roi_src, roi_dst, None, None, plot_matches
        )

        if not intact_translation:
            raise ValueError("ROIs cannot be aligned by translation.")

        # Apply translation - Change the source and return it
        (h, w) = img_dst.shape[:2]
        aligned_img_src = cv2.warpAffine(img_src, translation, (w, h))
        return aligned_img_src

    def _match_roi_images(
        self,
        img_src: darsia.Image,
        img_dst: darsia.Image,
        roi_src: Optional[tuple],
        roi_dst: Optional[tuple],
        plot_matches: bool = False,
    ) -> np.ndarray:
        """Align two images through feature matching in provided ROIs.

        Args:
            img_src (image): source image, which will be modified and aligned
            img_dst (image): destination image
            roi_src (tuple of slices): region of interested associated to the source image
            roi_dst (tuple of slices): region of interested associated to the destination image
                translation
            plot_matches (bool): flag controlling whether the matching features are plotted;
                useful for debugging; default value is False

        """
        # Determine effective translation
        translation, intact_translation = self.find_effective_translation(
            img_src.img, img_dst.img, roi_src, roi_dst, None, None, plot_matches
        )

        if not intact_translation:
            raise ValueError("ROIs cannot be aligned by translation.")

        # Apply translation - Modify image internally
        (h, w) = img_dst.img.shape[:2]
        aligned_img_src = cv2.warpAffine(img_src.img, translation, (w, h))
        return aligned_img_src

    def _find_matching_transformation(
        self,
        img_src: np.ndarray,
        img_dst: np.ndarray,
        roi_src: Optional[tuple] = None,
        roi_dst: Optional[tuple] = None,
        mask_src: Optional[np.ndarray] = None,
        mask_dst: Optional[np.ndarray] = None,
        transformation_type: str = "homography",
        keep_percent: float = 0.1,
        return_matches: bool = False,
        plot_matches: bool = False,
    ) -> tuple:
        """Determine matching map (homography or partial affine transformation).

        Args:
            img_src (np.ndarray): source image
            img_dst (np.ndarry): destination image
            roi_src (tuple of slices, optional): region of interest for the source image
            roi_dst (tuple of slices, optional): region of interest for the destination image
            mask_src (np.ndarray, optional): boolean mask detecting considered pixels in
                the analysis; if None, all pixels are considered.
            mask_dst (np.ndarray, optional): boolean mask detecting considered pixels in
                the analysis; if None, all pixels are considered.
            transformation_type (str): either "homography" or "partial_affine"
            keep_percent (float): how much of the features should be considered for finding
                the transformation
            return_matches (bool): flag controlling whether the inliers among all matches
                are returned
            plot_matches (bool): flag controlling whether found matches are plotted;
                default is False

        Returns:
            np.ndarray: transformation matrix operating on pixel coordinates using reverse
                matrix indexing
            bool: flag indicating whether the procedure was successful

        """
        if transformation_type not in ["homography", "partial_affine"]:
            raise ValueError(
                f"Transformation type {transformation_type} not supported."
            )

        # Manage ROIs
        if roi_src is not None:
            if roi_dst is None:
                roi_dst = roi_src

            # Only cover the case of compatible ROIs for now.
            assert img_src[roi_src].shape == img_dst[roi_dst].shape

        # Only continue if images contain a sufficient amount of pixels.
        if min(img_src.shape[:2]) < 2:
            have_features_src = have_features_dst = False
        else:
            # Extract features for both images restricted to the ROI.
            # Pixel coordinates are prescibed using reverse matrix indexing.
            features_src, have_features_src = FeatureDetection.extract_features(
                img_src, roi_src, mask_src, self._max_features
            )
            features_dst, have_features_dst = FeatureDetection.extract_features(
                img_dst, roi_dst, mask_dst, self._max_features
            )

        # Check whether features are valid
        if not (have_features_src and have_features_dst):
            if return_matches:
                return None, False, None
            else:
                return None, False

        # Determine matching points
        (pts_src, pts_dst), have_match, matches = FeatureDetection.match_features(
            features_src, features_dst, keep_percent=keep_percent, return_matches=True
        )

        # Determine matching transformation, operating on pixel coordinates using
        # reverse matrix indexing. Allow for different models.
        transformation = None
        if have_match:
            # Homography
            if transformation_type == "homography":
                transformation, mask = cv2.findHomography(
                    pts_src, pts_dst, method=cv2.RANSAC
                )
            # Affine map including merely scaling, rotation, and translation
            elif transformation_type == "partial_affine":
                transformation, mask = cv2.estimateAffinePartial2D(pts_src, pts_dst)

        # Monitor success
        intact_transformation = transformation is not None

        # Flag inliers
        inliers = (
            (
                pts_src[mask[:, 0].astype(bool)].reshape(-1, 2),
                pts_dst[mask[:, 0].astype(bool)].reshape(-1, 2),
            )
            if intact_transformation
            else None
        )

        # Plot matches in both images
        if plot_matches and intact_transformation:
            kps_src, _ = features_src
            kps_dst, _ = features_dst

            matchedVis = cv2.drawMatches(
                img_src, kps_src, img_dst, kps_dst, matches, None
            )

            plt.imshow(matchedVis)
            plt.show()

        if return_matches:
            return transformation, intact_transformation, inliers
        else:
            return transformation, intact_transformation

    def _isclose_translation(self, transformation: np.ndarray) -> bool:
        """Checking whether a transformation is close to a translation.

        Args:
            transformation (np.ndarray): transformation matrix, e.g., homography,
                or affine map

        Returns:
            bool: flag whether transformation is close to a translation

        """
        return transformation is not None and np.allclose(
            transformation[:2, :2], np.eye(2), atol=self._tol
        )

    def _find_translation(self, matches: tuple) -> tuple:
        """Determine a translation as average translation between two sets of points.

        NOTE: The average translation is identical to the least squares minimizer
        among all translations. Including RANSAC would be optimal. However, in
        all workflows this method will be combined with methods like
        find_matching_transformation which involve RANSAC.

        Args:
            matches (tuple of arrays): src and dst points, which are supposed to
                be a translation from each other apart.
        Returns:
            np.ndarray: translation matrix
            bool: flag indicating whether the procedure was successful

        """
        # Extract the translation directly as average displacement from all
        # provided matches - have to assume that the matches are well chosen.
        # NOTE: As matches will result as output from cv2 routines, these use
        # (col, row)-indexing, i.e., reverse matrix indexing.
        src, dst = matches
        displacement = np.average(dst - src, axis=0)
        affine_translation = np.hstack((np.eye(2), displacement.reshape((2, 1))))

        # Procedure successful - return the translation
        return affine_translation, True




[docs]
class TranslationCorrection(darsia.BaseCorrection):
    """Translation correction based on user-input global translation.

    Translation is provided as array or path to numpy array.

    """

    def __init__(self, translation: Optional[Union[str, Path]] = None):
        """Contructor.

        Args:
            translation (str or Path): path to predefined translation.

        """

        # Read translation from file
        if translation is not None:
            self.translation = np.load(Path(translation))
            """Translation map/array."""

            self.active = True
            """Flag controlling whether the correction is active."""

        else:
            self.active = False


[docs]
    def correct_array(self, img: np.ndarray) -> np.ndarray:
        """Main routine. Perform translation.

        Args:
            img (np.ndarray): image to be corrected.

        Returns:
            array: Corrected image

        """
        (h, w) = img.shape[:2]
        translated_img = cv2.warpAffine(img, self.translation, (w, h))
        return translated_img


    # ! ---- I/O ----


[docs]
    def save(self, path: Path) -> None:
        raise NotImplementedError("Not implemented yet.")



[docs]
    def load(self, path: Path) -> None:
        raise NotImplementedError("Not implemented yet.")