Source code for pandora.matching_cost.zncc

#!/usr/bin/env python
# coding: utf8
#
# Copyright (c) 2026 Centre National d'Etudes Spatiales (CNES).
#
# This file is part of PANDORA
#
#     https://github.com/CNES/Pandora
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
"""
This module contains functions associated to ZNCC method used in the cost volume measure step.
"""

from typing import Dict, Union, Tuple, List

import numpy as np
import xarray as xr
from json_checker import Checker, And

from pandora.img_tools import shift_right_img, compute_mean_raster, compute_std_raster
from pandora.matching_cost import matching_cost

from pandora.profiler import profile


@matching_cost.AbstractMatchingCost.register_subclass("zncc")

[docs]
class Zncc(matching_cost.AbstractMatchingCost):
    """
    Zero mean normalized cross correlation
    Zncc class allows to compute the cost volume
    """

    @profile("zncc.__init__")
    def __init__(self, **cfg: Union[str, int]) -> None:
        """
        :param cfg: optional configuration,  {'window_size': value, 'subpix': value}
        :type cfg: dictionary
        :return: None
        """
        super().instantiate_class(**cfg)


[docs]
    def check_conf(self, **cfg: Dict[str, Union[str, int]]) -> Dict[str, Union[str, int]]:
        """
        Add default values to the dictionary if there are missing elements and check if the dictionary is correct

        :param cfg: matching cost configuration
        :type cfg: dict
        :return cfg: matching cost configuration updated
        :rtype: dict
        """
        cfg = super().check_conf(**cfg)

        schema = self.schema
        schema["matching_cost_method"] = And(str, lambda input: input == "zncc")
        schema["window_size"] = And(int, lambda input: input > 0 and (input % 2) != 0)

        checker = Checker(schema)
        checker.validate(cfg)
        return cfg



[docs]
    def point_interval(
        self, img_left: xr.Dataset, img_right: xr.Dataset, disp: float
    ) -> Tuple[Tuple[int, int], Tuple[int, int]]:
        """
        Update point_p and point_q values if abs(disp) > nb_col - (int(self._window_size / 2) * 2).

        :param img_left: left Dataset image containing :

                - im: 2D (row, col) or 3D (band_im, row, col) xarray.DataArray float32
                - disparity (optional): 3D (disp, row, col) xarray.DataArray float32
                - msk (optional): 2D (row, col) xarray.DataArray int16
                - classif (optional): 3D (band_classif, row, col) xarray.DataArray int16
                - segm (optional): 2D (row, col) xarray.DataArray int16
                - edges (optional): 2D (row, col) xarray.DataArray int16
        :type img_left: xarray.Dataset
        :param img_right: right Dataset image containing :

                - im: 2D (row, col) or 3D (band_im, row, col) xarray.DataArray float32
                - disparity (optional): 3D (disp, row, col) xarray.DataArray float32
                - msk (optional): 2D (row, col) xarray.DataArray int16
                - classif (optional): 3D (band_classif, row, col) xarray.DataArray int16
                - segm (optional): 2D (row, col) xarray.DataArray int16
                - edges (optional): 2D (row, col) xarray.DataArray int16
        :type img_right: xarray.Dataset
        :param disp: current disparity
        :type disp: float
        :return: the range of the left and right image over which the similarity measure will be applied
        :rtype: tuple
        """

        point_p, point_q = super().point_interval(img_left, img_right, disp)

        nx_left = int(img_left.sizes["col"])
        nx_right = int(img_right.sizes["col"])

        if abs(disp) > nx_right - (int(self._window_size / 2) * 2):
            point_p = (nx_left, nx_left)
            point_q = (nx_right, nx_right)

        return point_p, point_q


    @profile("zncc.compute_cost_volume")

[docs]
    def compute_cost_volume(
        self,
        img_left: xr.Dataset,
        img_right: xr.Dataset,
        cost_volume: xr.Dataset,
    ) -> xr.Dataset:
        """
        Computes the cost volume for a pair of images

        :param img_left: left Dataset image containing :

                - im: 2D (row, col) or 3D (band_im, row, col) xarray.DataArray float32
                - disparity (optional): 3D (disp, row, col) xarray.DataArray float32
                - msk (optional): 2D (row, col) xarray.DataArray int16
                - classif (optional): 3D (band_classif, row, col) xarray.DataArray int16
                - segm (optional): 2D (row, col) xarray.DataArray int16
                - edges (optional): 2D (row, col) xarray.DataArray int16
        :type img_left: xarray.Dataset
        :param img_right: right Dataset image containing :

                - im: 2D (row, col) or 3D (band_im, row, col) xarray.DataArray float32
                - disparity (optional): 3D (disp, row, col) xarray.DataArray float32
                - msk (optional): 2D (row, col) xarray.DataArray int16
                - classif (optional): 3D (band_classif, row, col) xarray.DataArray int16
                - segm (optional): 2D (row, col) xarray.DataArray int16
                - edges (optional): 2D (row, col) xarray.DataArray int16
        :type img_right: xarray.Dataset
        :param cost_volume: an empty cost volume
        :type cost_volume: xr.Dataset
        :return: the cost volume dataset , with the data variables:

                - cost_volume 3D xarray.DataArray (row, col, disp)
        :rtype: xarray.Dataset
        """
        # check band parameter
        self.check_band_input_mc(img_left, img_right)

        # Contains the shifted right images
        img_right_shift = shift_right_img(img_right, self._subpix, self._band, self._spline_order)

        # Computes the standard deviation raster for the whole images
        # The standard deviation raster is truncated for points that are not calculable
        img_left_std = compute_std_raster(img_left, self._window_size, self._band)
        img_right_std = []
        for i, img in enumerate(img_right_shift):  # pylint: disable=unused-variable
            img_right_std.append(compute_std_raster(img, self._window_size, self._band))

        # Computes the mean raster for the whole images
        # The standard mean raster is truncated for points that are not calculable
        img_left_mean = compute_mean_raster(img_left, self._window_size, self._band)
        img_right_mean = []
        for i, img in enumerate(img_right_shift):
            img_right_mean.append(compute_mean_raster(img, self._window_size, self._band))

        # Cost volume metadata
        offset_row_col = cost_volume.attrs["offset_row_col"]
        cost_volume.attrs.update(
            {
                "type_measure": "max",
                "cmax": 1,  # Maximal cost of the cost volume with zncc measure
            }
        )

        disparity_range = cost_volume.coords["disp"].data
        cv = self.allocate_numpy_cost_volume(img_left, disparity_range)
        cv_crop = self.crop_cost_volume(cv, offset_row_col)

        # Computes the matching cost
        for disp_index, disp in enumerate(disparity_range):
            i_right = int((disp % 1) * self._subpix)
            point_p, point_q = self.point_interval(img_left, img_right_shift[i_right], disp)

            # Point interval in the left standard deviation image
            # -  (win_radius * 2) because img_std is truncated for points that are not calculable
            p_std = (point_p[0], point_p[1] - (int(self._window_size / 2) * 2))
            # Point interval in the right standard deviation image
            q_std = (point_q[0], point_q[1] - (int(self._window_size / 2) * 2))

            if self._band is not None:
                band_index_left = list(img_left.band_im.data).index(self._band)
                band_index_right = list(img_right.band_im.data).index(self._band)
                if len(img_right_shift[i_right]["im"].shape) > 2:
                    # Compute the normalized summation of the product of intensities
                    zncc_ = (
                        img_left["im"].data[band_index_left, :, point_p[0] : point_p[1]]
                        * img_right_shift[i_right]["im"].data[band_index_right, :, point_q[0] : point_q[1]]
                    )
                else:
                    # Compute the normalized summation of the product of intensities
                    zncc_ = (
                        img_left["im"].data[band_index_left, :, point_p[0] : point_p[1]]
                        * img_right_shift[i_right]["im"].data[:, point_q[0] : point_q[1]]
                    )
            else:
                # Compute the normalized summation of the product of intensities
                zncc_ = (
                    img_left["im"].data[:, point_p[0] : point_p[1]]
                    * img_right_shift[i_right]["im"].data[:, point_q[0] : point_q[1]]
                )

            zncc_ = xr.Dataset(
                {"im": (["row", "col"], zncc_)},
                coords={
                    "row": np.arange(zncc_.shape[0]),
                    "col": np.arange(zncc_.shape[1]),
                },
            )
            zncc_ = compute_mean_raster(zncc_, self._window_size, self._band)
            # Subtracting  the  local mean  value  of  intensities
            zncc_ -= img_left_mean[:, p_std[0] : p_std[1]] * img_right_mean[i_right][:, q_std[0] : q_std[1]]

            # Divide by the standard deviation of the intensities of the images
            apply_divide_standard(zncc_, img_left_std, img_right_std, p_std, q_std, i_right)

            # Places the result in the cost_volume
            cv_crop[disp_index, point_p[0] : p_std[1], :] = np.swapaxes(zncc_, 0, 1)

        # Create the xarray.DataSet that will contain the cost_volume of dimensions (row, col, disp)
        # Computations were optimized with a cost_volume of dimensions (disp, row, col)
        # As we are expected to return a cost_volume of dimensions (row, col, disp),
        # we swap axes.
        cv = np.swapaxes(cv, 0, 2)
        index_col = cost_volume.attrs["col_to_compute"]
        index_col = index_col - img_left.coords["col"].data[0]  # If first col coordinate is not 0
        cost_volume["cost_volume"].data = cv[:, index_col, :]

        return cost_volume





[docs]
def apply_divide_standard(
    zncc: np.ndarray,
    img_left: np.ndarray,
    img_right: List[np.ndarray],
    p_std: Tuple[int, int],
    q_std: Tuple[int, int],
    i_right: int,
):
    """
    Divide by the standard deviation of the intensities of the images

    :param zncc:
    :type zncc: np.ndarray
    :param img_left: standard deviation raster of left image
    :type img_left: np.ndarray
    :param img_right: standard deviation raster list of right image (for each subpix)
    :type img_right: List[np.ndarray]
    :param p_std: point interval in the left standard deviation image
    :type p_std: Tuple[int, int]
    :param q_std: Point interval in the right standard deviation image
    :type q_std: Tuple[int, int]
    :param i_right: ith image
    :type i_right: int
    """
    # If the standard deviation of the intensities of the images is greater than 0
    divide_standard = np.multiply(
        img_left[:, p_std[0] : p_std[1]],
        img_right[i_right][:, q_std[0] : q_std[1]],
    )
    valid = np.where(divide_standard > 0)
    zncc[valid] /= divide_standard[valid]

    # Otherwise zncc is equal to 0
    zncc[np.where(divide_standard <= 0)] = 0