Source code for minian.motion_correction

import itertools as itt
import warnings
from typing import Any

import cv2
import dask as da
import dask.array as darr
import numpy as np
import SimpleITK as sitk
import xarray as xr
from skimage.registration import phase_cross_correlation

from .utilities import xrconcat_recursive



[docs]
def estimate_motion(
    varr: xr.DataArray,
    dim: str = "frame",
    npart: int = 3,
    chunk_nfm: int | None = None,
    mesh_size: tuple[int, int] | None = None,
    **kwargs: Any,
) -> xr.DataArray:
    """
    Estimate motion for each frame of the input movie data.

    This function estimates motion using a recursive approach. The movie is
    splitted into chunks of `npart` frames and motion estimation is carried out
    within each chunk relative to the middle frame, then a template is generated
    for each chunk by aggregating the motion-corrected frames within each chunk.
    Next, every `npart` chunks are grouped together, and motion estimation is
    carried out within each group relative to the middle chunk using the
    aggregated templates. The chunk-level motions are added on top of the
    previous within-chunk level motions. This step is then repeated recursively
    until we are left with a single chunk representing the full movie, at which
    point the motion estimation is finished.

    The motion estimation itself is carried out with fft-based phase correlation
    by default. Alternatively, non-rigid motion correction can be carried out by
    modelling the motion of each frame as translations of individual vertices of
    a smooth BSpline mesh. The estimation of the translations can then be find
    by gradient descent using correlation between frames as objective. This
    feature is currently experimental. Additionally, various correction
    procedures can be carry out to filter out frames not suited as template for
    motion correction, or to correct for large false shifts when the quality of
    templates are low.

    Parameters
    ----------
    varr : xr.DataArray
        Input movie data.
    dim : str, optional
        The dimension along which motion estimation should be carried out. By
        default `"frame"`.
    npart : int, optional
        Number of frames/chunks to combine for the recursive algorithm. By
        default `3`.
    chunk_nfm : int, optional
        Number of frames in each parallel task. Note that this only affects dask
        graph construction, but not the recursion of the algorithm. If `None`
        then the dask chunksize along `dim` will be used. By default `None`.

    Keyword Arguments
    -----------------
    alt_error : float, optional
        Error threshold between estimated shifts from two alternative methods,
        specified in pixels. If not `None`, then for each chunk during
        recursion, the first and last frame of that chunk will be returned in
        addition to the aggregated template. And when estimating motion between
        chunks, the estimation will be carried out twice: once using the
        aggregated templates, once using the consecutive first/last frames
        between chunks. The result of these two methods will then be compared.
        If their absolute difference is larger than `alt_error`, then the result
        with smaller absolute value (closer to zero shifts) will be used. This
        is useful to correct for cases where activities of cells are sparse and
        changing across chunks, leading to wrong features being matched in
        aggregated templates. If `None` then no additional checking will be
        performed. By default `5`.
    aggregation : str, optional
        How frames should be aggregated to generate the template for each chunk.
        Should be either "mean" or "max". By default `"mean"`.
    upsample : int, optional
        The upsample factor for sub-pixel accuracy on the non-rigid
        (`mesh_size`) path. The rigid path refines the cross-correlation peak by
        parabolic interpolation instead and ignores this factor.
    circ_thres : float, optional
        The circularity threshold to check whether a frame can serve as a good
        template for estimating motion. If not `None`, then for each frame a
        comparison image is computed using :func:`cv2.matchTemplate` between the
        frame and zero-padded version (up to `max_sh`) using
        `cv2.TM_SQDIFF_NORMED`. The comparison image of a good template should
        only have `< 1` values around the center and the `< 1` region should be
        circular. Hence the circularity defined as `4 * np.pi * (area /
        (perimeter ** 2))` for the `< 1` region is computed, and any frame with
        circularity smaller than `circ_thres` is excluded from propagation of
        shifts and aggregation of templates. By default `None`.
    max_sh : int, optional
        Amount of zero padding when checking for the quality of frames,
        specified in pixels. Only used if `circ_thres is not None`. See
        `circ_thres` for more detail. By default `100`.
    mesh_size : tuple[int, int], optional
        Number of control points for the BSpline mesh in each dimension,
        specified in the order ("height", "width"). If not `None` then the
        experimental non-rigid motion estimation is enabled. By default `None`
    niter : int, optional
        Max number of iteration for the gradient descent process of estimation
        BSpline parameters. Only used if `mesh_size is not None`. By default
        `100`.
    bin_thres : int, optional
        Intensity threshold for binarizing the frames. The binarized frame will
        be used as masks for non-rigid motion estimation, where only pixels in
        the mask will be used to evaluate the gradient during optimization.
        Significantly improve performance but sacrifice accuracy of estimation
        for dim regions. Only used if `mesh_size is not None`. By default
        `None`.

    Returns
    -------
    motion : xr.DataArray
        Estimated motion for each frame. Has two dimensions `dim` and
        `"shift_dim"` representing rigid shifts in each direction if `mesh_size
        is None`, otherwise has four dimensions: `dim`, `"grid0"`, `"grid1"` and
        `"shift_dim"` representing shifts for each mesh grid control point.

    See Also
    --------
    :doc:`simpleitk:registrationOverview` :
        for overview of the non-rigid estimation method
    """
    varr = varr.transpose(..., dim, "height", "width")
    loop_dims = list(set(varr.dims) - {"height", "width", dim})
    if npart is None:
        # by default use a npart that result in two layers of recursion
        npart = max(3, int(np.ceil((varr.sizes[dim] / chunk_nfm) ** (1 / 2))))
    if loop_dims:
        loop_labs = [varr.coords[d].values for d in loop_dims]
        res_dict = {}
        for lab in itt.product(*loop_labs):
            va = varr.sel({loop_dims[i]: lab[i] for i in range(len(loop_dims))})
            vmax, sh = est_motion_part(va.data, npart, chunk_nfm, mesh_size=mesh_size, **kwargs)
            if mesh_size:
                sh = xr.DataArray(
                    sh,
                    dims=[dim, "shift_dim", "grid0", "grid1"],
                    coords={
                        dim: va.coords[dim].values,
                        "shift_dim": ["height", "width"],
                    },
                )
            else:
                sh = xr.DataArray(
                    sh,
                    dims=[dim, "shift_dim"],
                    coords={
                        dim: va.coords[dim].values,
                        "shift_dim": ["height", "width"],
                    },
                )
            res_dict[lab] = sh.assign_coords(**dict(zip(loop_dims, lab)))
        sh = xrconcat_recursive(res_dict, loop_dims)
    else:
        vmax, sh = est_motion_part(varr.data, npart, chunk_nfm, mesh_size=mesh_size, **kwargs)
        if mesh_size:
            sh = xr.DataArray(
                sh,
                dims=[dim, "shift_dim", "grid0", "grid1"],
                coords={
                    dim: varr.coords[dim].values,
                    "shift_dim": ["height", "width"],
                },
            )
        else:
            sh = xr.DataArray(
                sh,
                dims=[dim, "shift_dim"],
                coords={
                    dim: varr.coords[dim].values,
                    "shift_dim": ["height", "width"],
                },
            )
    return sh




[docs]
def est_motion_part(
    varr: darr.Array,
    npart: int,
    chunk_nfm: int,
    alt_error: float = 5,
    mesh_size: tuple[int, int] | None = None,
    **kwargs: Any,
) -> tuple[darr.Array, darr.Array]:
    """
    Construct dask graph for the recursive motion estimation algorithm.

    Parameters
    ----------
    varr : darr.Array
        Input dask array representing movie data.
    npart : int
        Number of frames/chunks to combine for the recursive algorithm.
    chunk_nfm : int
        Number of frames in each parallel task.
    alt_error : int, optional
        Error threshold between estimated shifts from two alternative methods,
        specified in pixels. By default `5`.
    mesh_size : tuple[int, int], optional
        Number of control points for the BSpline mesh in each dimension. If not
        `None` the experimental non-rigid motion estimation is enabled. By
        default `None`.

    Returns
    -------
    temps : darr.Array
        Registration template for the movie.
    shifts : darr.Array
        Estimated motion.
    See Also
    --------
    estimate_motion
    """
    if chunk_nfm is None:
        chunk_nfm = varr.chunksize[0]
    varr = varr.rechunk((chunk_nfm, None, None))
    has_mesh = bool(mesh_size)
    if has_mesh:
        param = get_bspline_param(varr[0].compute(), mesh_size)
    height, width = varr.shape[1], varr.shape[2]
    tmp_shape = (3, height, width) if alt_error else (height, width)
    sh_shape = (sum(varr.chunks[0]), 2)
    if has_mesh:
        sh_shape = sh_shape + (int(param[1]), int(param[0]))

    # Keep each chunk's result as one delayed `(template, shifts)` tuple and feed
    # the whole tuple into the next reduction step. Splitting it into separate
    # `res[0]`/`res[1]` dask nodes would route the shared `est_motion_chunk` task
    # through two graph paths and run it once per path -- a blow-up that compounds
    # with recursion depth. The final tuple is split once, at the end.
    res_ls = [
        da.delayed(est_motion_chunk)(
            blk, None, alt_error=alt_error, npart=npart, mesh_size=mesh_size, **kwargs
        )
        for blk in varr.blocks
    ]
    while len(res_ls) > 1:
        res_ls = [
            da.delayed(_est_motion_reduce)(
                res_ls[idx : idx + npart],
                alt_error,
                npart,
                mesh_size=mesh_size,
                **kwargs,
            )
            for idx in range(0, len(res_ls), npart)
        ]
    res = res_ls[0]
    temps = darr.from_delayed(res[0], shape=tmp_shape, dtype=varr.dtype)
    shifts = darr.from_delayed(res[1], shape=sh_shape, dtype=float)
    return temps, shifts



def _est_motion_reduce(
    res_grp: list, alt_error: float, npart: int, **kwargs: Any
) -> tuple[np.ndarray, np.ndarray]:
    """
    Combine a group of per-chunk results for one reduction step.

    Stacks the chunk templates into a single array and gathers their shifts, then
    runs :func:`est_motion_chunk` on the aggregate. Consumes the whole
    `(template, shifts)` tuples to avoid dask task duplication; see
    :func:`est_motion_part`.

    Parameters
    ----------
    res_grp : list
        list of `(template, shifts)` tuples for the chunks in this group.
    alt_error : float
        Error threshold between estimated shifts from two alternative methods.
    npart : int
        Number of frames/chunks to combine for the recursive algorithm.

    Returns
    -------
    tmp : np.ndarray
        Aggregated template for the group.
    motions : np.ndarray
        Combined motion estimates for the group.

    See Also
    --------
    est_motion_part
    est_motion_chunk
    """
    tmps = np.stack([r[0] for r in res_grp], axis=0)
    sh_org_ls = [r[1] for r in res_grp]
    return est_motion_chunk(tmps, sh_org_ls, alt_error=alt_error, npart=npart, **kwargs)



[docs]
def est_motion_chunk(
    varr: np.ndarray,
    sh_org: np.ndarray,
    npart: int,
    alt_error: float,
    aggregation: str = "mean",
    upsample: int = 100,
    max_sh: int = 100,
    circ_thres: float | None = None,
    mesh_size: tuple[int, int] | None = None,
    niter: int = 100,
    bin_thres: float | None = None,
) -> tuple[np.ndarray, np.ndarray]:
    """
    Carry out motion estimation per chunk.

    Parameters
    ----------
    varr : np.ndarray
        Input chunk of movie.
    sh_org : np.ndarray
        Original motions to be added upon.
    npart : int
        Number of frames/chunks to combine for the recursive algorithm.
    alt_error : float
        Error threshold between estimated shifts from two alternative methods,
        specified in pixels.
    aggregation : str, optional
        How frames should be aggregated to generate the template. By default
        `"mean"`.
    upsample : int, optional
        The upsample factor. By default `100`.
    max_sh : int, optional
        Amount of zero padding when checking for the quality of frames,
        specified in pixels. By default `100`.
    circ_thres : float, optional
        The circularity threshold to check whether a frame can serve as a good
        template for estimating motion. By default `None`.
    mesh_size : tuple[int, int], optional
        Number of control points for the BSpline mesh in each dimension. By
        default `None`.
    niter : int, optional
        Max number of iteration for the gradient descent process. By default `100`.
    bin_thres : float, optional
        Intensity threshold for binarizing the frames. By default `None`.

    Returns
    -------
    tmp : np.ndarray
        The template of current chunk for further motion estimation.
    motions : np.ndarray
        Motions between frames within the chunk.

    Raises
    ------
    ValueError
        if `aggregation` is not `"mean"` or `"max"`

    See Also
    --------
    estimate_motion : for detailed explanation of parameters
    """
    if varr.ndim == 3 and varr.shape[0] == 1:
        if sh_org is not None:
            motions = sh_org
        else:
            if mesh_size is not None:
                # TODO handle non-rigid case
                pass
            else:
                motions = np.array([0, 0])[np.newaxis, :]
        tmp = np.stack([varr[0]] * 3) if alt_error else varr[0]
        return tmp, motions
    while varr.shape[0] > npart:
        part_idx = np.array_split(np.arange(varr.shape[0]), np.ceil(varr.shape[0] / npart))
        tmp_ls = []
        sh_ls = []
        for idx in part_idx:
            cur_tmp, cur_motions = est_motion_chunk(
                varr[idx],
                [sh_org[i] for i in idx] if sh_org is not None else None,
                npart=npart,
                alt_error=alt_error,
                aggregation=aggregation,
                upsample=upsample,
                max_sh=max_sh,
                circ_thres=circ_thres,
                mesh_size=mesh_size,
                niter=niter,
                bin_thres=bin_thres,
            )
            tmp_ls.append(cur_tmp)
            sh_ls.append(cur_motions)
        varr = np.stack(tmp_ls, axis=0)
        sh_org = sh_ls
    # varr could have 4 dimensions in which case the second dimension has length
    # 3 representing the first, aggregated and the last frame of a chunk
    mask = np.ones_like(varr, dtype=bool)
    if bin_thres is not None and varr.ndim <= 3:
        for i, fm in enumerate(varr):
            mask[i] = fm > bin_thres
    good_fm = np.ones(varr.shape[0], dtype=bool)
    if circ_thres is not None and varr.ndim <= 3:
        for i, fm in enumerate(varr):
            good_fm[i] = check_temp(fm, max_sh) > circ_thres
    good_idxs = np.where(good_fm)[0].astype(int)
    prop_good = len(good_idxs) / len(good_fm)
    if prop_good < 0.9:
        warnings.warn(
            f"only {prop_good} of the frames are good.Consider lowering your circularity threshold",
            stacklevel=2,
        )
    # use good frame closest to center as template
    mid = good_idxs[np.abs(good_idxs - varr.shape[0] / 2).argmin()]
    if mesh_size is not None:
        fm0 = varr[0, 0] if varr.ndim > 3 else varr[0]
        param = get_bspline_param(fm0, mesh_size)
        motions = np.zeros((varr.shape[0], 2, int(param[1]), int(param[0])))
    else:
        motions = np.zeros((varr.shape[0], 2))
    # Precompute each frame's rfft2 once for the rigid path so it can be reused
    # across the two registrations it participates in (as src and as a
    # neighbour's dst). For 4D reduction input the registered image is the
    # aggregated frame (slot 1); alt-error additionally uses slots 0/2.
    use_fft = mesh_size is None
    fft_mid = fft_first = fft_last = None
    if use_fft:
        if varr.ndim > 3:
            fft_mid = np.fft.rfft2(varr[:, 1], axes=(-2, -1))
            if alt_error:
                fft_first = np.fft.rfft2(varr[:, 0], axes=(-2, -1))
                fft_last = np.fft.rfft2(varr[:, 2], axes=(-2, -1))
        else:
            fft_mid = np.fft.rfft2(varr, axes=(-2, -1))
    for i, _fm in enumerate(varr):
        src_fft = dst_fft = src_alt_fft = dst_alt_fft = None
        # register each frame against its neighbour toward the center frame
        if i < mid:
            j, slc = i + 1, slice(0, i + 1)
        elif i > mid:
            j, slc = i - 1, slice(i, None)
        else:
            continue
        if varr.ndim > 3:
            src, dst = varr[i][1], varr[j][1]
            src_ma, dst_ma = mask[i][1], mask[j][1]
            if use_fft:
                src_fft, dst_fft = fft_mid[i], fft_mid[j]
            if alt_error:
                # cross-chunk check against the adjacent first/last frames
                if i < mid:
                    src_alt, dst_alt = varr[i][2], varr[j][0]
                    src_alt_ma, dst_alt_ma = mask[i][2], mask[j][0]
                    if use_fft:
                        src_alt_fft, dst_alt_fft = fft_last[i], fft_first[j]
                else:
                    src_alt, dst_alt = varr[i][0], varr[j][2]
                    src_alt_ma, dst_alt_ma = mask[i][0], mask[j][2]
                    if use_fft:
                        src_alt_fft, dst_alt_fft = fft_first[i], fft_last[j]
        else:
            # select the nearest good frame toward the center as template
            if i < mid:
                didx = good_idxs[good_idxs - j >= 0][0]
            else:
                didx = good_idxs[good_idxs - j <= 0][-1]
            src, dst = varr[i], varr[didx]
            src_ma, dst_ma = mask[i], mask[didx]
            if use_fft:
                src_fft, dst_fft = fft_mid[i], fft_mid[didx]
        mo = est_motion_perframe(
            src,
            dst,
            upsample,
            src_ma,
            dst_ma,
            mesh_size,
            niter,
            src_fft=src_fft,
            dst_fft=dst_fft,
        )
        if alt_error and varr.ndim > 3:
            mo_alt = est_motion_perframe(
                src_alt,
                dst_alt,
                upsample,
                src_alt_ma,
                dst_alt_ma,
                mesh_size,
                niter,
                src_fft=src_alt_fft,
                dst_fft=dst_alt_fft,
            )
            if ((np.abs(mo - mo_alt) > alt_error).any()) and (
                np.abs(mo).sum() > np.abs(mo_alt).sum()
            ):
                mo = mo_alt
        # only add to the rest if current frame is good
        if good_fm[i]:
            motions[slc] = motions[slc] + mo
        else:
            motions[i] = motions[i] + mo
    # center shifts
    if mesh_size is not None:
        motions -= motions.mean(axis=(0, 2, 3), keepdims=True)
    else:
        motions -= motions.mean(axis=0)
    for i, v in enumerate(varr):
        if i not in good_idxs:
            continue
        if v.ndim > 2:
            for j, fm in enumerate(v):
                varr[i][j] = transform_perframe(fm, motions[i], fill=0)
        else:
            varr[i] = transform_perframe(v, motions[i], fill=0)
    varr = varr[good_idxs]
    if aggregation == "max":
        tmp = varr.max(axis=(0, 1)) if varr.ndim > 3 else varr.max(axis=0)
    elif aggregation == "mean":
        tmp = varr.mean(axis=(0, 1)) if varr.ndim > 3 else varr.mean(axis=0)
    else:
        raise ValueError(f"does not understand aggregation: {aggregation}")
    if alt_error:
        if varr.ndim > 3:
            tmp0 = varr[0][0]
            tmp1 = varr[-1][-1]
        else:
            tmp0 = varr[0]
            tmp1 = varr[1]
        tmp = np.stack([tmp0, tmp, tmp1], axis=0)
    if sh_org is not None:
        motions = np.concatenate([motions[i] + sh for i, sh in enumerate(sh_org)], axis=0)
    return tmp, motions



def _xcorr_subpixel(src_fft: np.ndarray, dst_fft: np.ndarray, shape: tuple[int, int]) -> np.ndarray:
    """
    Sub-pixel shift between two frames from their precomputed real FFTs.

    Computes the (un-normalized) cross-correlation -- matching
    :func:`skimage.registration.phase_cross_correlation` with
    `normalization=None` -- and refines the integer peak with a 1D parabolic fit
    along each axis. Taking precomputed `rfft2` results lets the caller reuse
    each frame's transform across the two registrations it participates in.

    Parameters
    ----------
    src_fft, dst_fft : np.ndarray
        `np.fft.rfft2` of the source and destination frames.
    shape : tuple[int, int]
        Spatial shape `(height, width)` of the frames.

    Returns
    -------
    shift : np.ndarray
        Shift `(height, width)` of src relative to dst; `-shift` registers src
        onto dst (the convention :func:`est_motion_perframe` returns).
    """
    # The cross-correlation peaks where src best aligns with dst; its (integer)
    # location is the whole-pixel shift between the two frames.
    cross_corr = np.fft.irfft2(src_fft * np.conj(dst_fft), s=shape)
    peak_idx = np.unravel_index(np.argmax(cross_corr), cross_corr.shape)
    peak_val = cross_corr[peak_idx]
    # Refine that integer peak to sub-pixel one axis at a time: fit a parabola
    # through the peak and its two immediate neighbours and take the vertex.
    # The FFT wraps negative shifts into the upper half of each axis, so a
    # refined position past the midpoint is folded back to a negative shift.
    shift = np.empty(2)
    for axis in range(2):
        axis_len = cross_corr.shape[axis]
        peak_pos = peak_idx[axis]
        # cross-correlation values at the neighbours one step below/above the peak
        idx_prev = list(peak_idx)
        idx_next = list(peak_idx)
        idx_prev[axis] = (peak_pos - 1) % axis_len
        idx_next[axis] = (peak_pos + 1) % axis_len
        val_prev = cross_corr[tuple(idx_prev)]
        val_next = cross_corr[tuple(idx_next)]
        denom = val_prev - 2 * peak_val + val_next
        delta = 0.5 * (val_prev - val_next) / denom if denom != 0 else 0.0
        refined_pos = peak_pos + delta
        if refined_pos > axis_len // 2:  # wrap negative shifts
            refined_pos -= axis_len
        shift[axis] = refined_pos
    return shift



[docs]
def est_motion_perframe(
    src: np.ndarray,
    dst: np.ndarray,
    upsample: int = 100,
    src_ma: np.ndarray | None = None,
    dst_ma: np.ndarray | None = None,
    mesh_size: tuple[int, int] | None = None,
    niter: int = 100,
    src_fft: np.ndarray | None = None,
    dst_fft: np.ndarray | None = None,
) -> np.ndarray:
    """
    Estimate motion given two frames.

    Parameters
    ----------
    src : np.ndarray
        The frame to be registered.
    dst : np.ndarray
        The destination frame of registration.
    upsample : int, optional
        Upsample factor. Only used for the non-rigid (`mesh_size`) path; the
        rigid path instead estimates sub-pixel shifts by fitting a parabola to
        the cross-correlation peak and its two neighbours along each axis. By
        default `100`.
    src_ma : np.ndarray, optional
        Boolean mask for `src`. Only used if `mesh_size is not None`. By default
        `None`.
    dst_ma : np.ndarray, optional
        Boolean mask for `dst`. Only used if `mesh_size is not None`. By default
        `None`.
    mesh_size : tuple[int, int], optional
        Number of control points for the BSpline mesh in each dimension. By
        default `None`.
    niter : int, optional
        Max number of iteration for the gradient descent process. By default
        `100`.
    src_fft, dst_fft : np.ndarray, optional
        Precomputed `np.fft.rfft2` of `src`/`dst` for the rigid path. If `None`
        they are computed on the fly. By default `None`.

    Returns
    -------
    motion : np.ndarray
        Estimated motion between two frames.

    See Also
    --------
    estimate_motion : for detailed explanation of parameters
    """
    if mesh_size is None:
        if src_fft is None:
            src_fft = np.fft.rfft2(src)
        if dst_fft is None:
            dst_fft = np.fft.rfft2(dst)
        return -_xcorr_subpixel(src_fft, dst_fft, src.shape)
    # TODO: This SimpleITK BSpline non-rigid path is experimental, likely unused
    # (the pipeline never sets `mesh_size`), and not ideal. Worth revisiting in
    # favour of a grid/patch-based piecewise-rigid approach like NoRMCorre, which
    # estimates a rigid shift per patch and interpolates between them.
    sh, error, phasediff = phase_cross_correlation(
        src,
        dst,
        upsample_factor=upsample,
        normalization=None,
    )
    src = sitk.GetImageFromArray(src.astype(np.float32))
    dst = sitk.GetImageFromArray(dst.astype(np.float32))
    reg = sitk.ImageRegistrationMethod()
    sh = sh[::-1]
    trans_init = sitk.TranslationTransform(2, sh)
    reg.SetMovingInitialTransform(trans_init)
    if src_ma is not None:
        reg.SetMetricMovingMask(sitk.GetImageFromArray(src_ma.astype(np.uint8)))
    if dst_ma is not None:
        reg.SetMetricFixedMask(sitk.GetImageFromArray(dst_ma.astype(np.uint8)))
    trans_opt = sitk.BSplineTransformInitializer(image1=dst, transformDomainMeshSize=mesh_size)
    reg.SetInitialTransform(trans_opt)
    reg.SetMetricAsCorrelation()
    reg.SetInterpolator(sitk.sitkLinear)
    reg.SetOptimizerAsGradientDescent(
        learningRate=0.1, convergenceMinimumValue=1e-5, numberOfIterations=niter
    )
    tx = reg.Execute(dst, src)
    coef = np.stack([sitk.GetArrayFromImage(im) for im in tx.Downcast().GetCoefficientImages()])
    coef = coef + sh.reshape((2, 1, 1))
    return coef



def match_temp(
    src: np.ndarray,
    dst: np.ndarray,
    max_sh: int,
    local: bool,
    subpixel: bool = False,
) -> np.ndarray:
    dst = np.pad(dst, max_sh)
    cor = cv2.matchTemplate(src.astype(np.float32), dst.astype(np.float32), cv2.TM_CCOEFF_NORMED)
    if not len(np.unique(cor)) > 1:
        return np.array([0, 0])
    cent = np.floor(np.array(cor.shape) / 2)
    if local:
        cor_ma = cv2.dilate(cor, np.ones((3, 3)))
        maxs = np.array(np.nonzero(cor_ma == cor))
        dev = ((maxs - cent[:, np.newaxis]) ** 2).sum(axis=0)
        imax = maxs[:, np.argmin(dev)]
    else:
        imax = np.unravel_index(np.argmax(cor), cor.shape)
    if subpixel:
        x0 = np.arange(max(imax[0] - 5, 0), min(imax[0] + 6, cor.shape[0]))
        x1 = np.arange(max(imax[1] - 5, 0), min(imax[1] + 6, cor.shape[1]))
        y0 = cor[x0, imax[1]]
        y1 = cor[imax[0], x1]
        p0 = np.polyfit(x0, y0, 2)
        p1 = np.polyfit(x1, y1, 2)
        imax = np.array([-0.5 * p0[1] / p0[0], -0.5 * p1[1] / p1[0]])
        # m0 = np.roots(np.polyder(p0)) # for higher order polynomial fit
        # m1 = np.roots(np.polyder(p1))
        # m0 = m0[np.argmin(np.abs(m0 - imax[0]))]
        # m1 = m1[np.argmin(np.abs(m1 - imax[1]))]
        # imax = np.array([m0, m1])
    sh = cent - imax
    return sh



[docs]
def check_temp(fm: np.ndarray, max_sh: int) -> float:
    """
    Compute the circularity metric for a frame.

    Parameters
    ----------
    fm : np.ndarray
        Input frame.
    max_sh : int
        Amount of zero padding when computing the comparison image.

    Returns
    -------
    circularity : float
        The circularity metric, will be `0` if the comparison image has more
        than one region with values `< 1`.

    See Also
    --------
    estimate_motion
    """
    fm_pad = np.pad(fm, max_sh)
    cor = cv2.matchTemplate(fm.astype(np.float32), fm_pad.astype(np.float32), cv2.TM_SQDIFF_NORMED)
    conts = cv2.findContours(
        (cor < 1).astype(np.uint8), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
    )[0]
    if len(conts) != 1:
        return 0
    cont = conts[0]
    perimeter = cv2.arcLength(cont, True)
    if perimeter <= 0:
        return 0
    area = cv2.contourArea(cont)
    circularity = 4 * np.pi * (area / (perimeter**2))
    return circularity



def apply_shifts(varr: xr.DataArray, shifts: xr.DataArray, fill: float = np.nan) -> xr.DataArray:
    sh_dim = shifts.coords["shift_dim"].values.tolist()
    varr_sh = xr.apply_ufunc(
        shift_perframe,
        varr.chunk(dict.fromkeys(sh_dim, -1)),
        shifts,
        input_core_dims=[sh_dim, ["shift_dim"]],
        output_core_dims=[sh_dim],
        vectorize=True,
        dask="parallelized",
        kwargs={"fill": fill},
        output_dtypes=[varr.dtype],
    )
    return varr_sh


def shift_perframe(fm: np.ndarray, sh: np.ndarray, fill: float = np.nan) -> np.ndarray:
    if np.isnan(fm).all():
        return fm
    sh = np.around(sh).astype(int)
    fm = np.roll(fm, sh, axis=np.arange(fm.ndim))
    index = [slice(None) for _ in range(fm.ndim)]
    for ish, s in enumerate(sh):
        index = [slice(None) for _ in range(fm.ndim)]
        if s > 0:
            index[ish] = slice(None, s)
            fm[tuple(index)] = fill
        elif s == 0:
            continue
        elif s < 0:
            index[ish] = slice(s, None)
            fm[tuple(index)] = fill
    return fm


def get_mask(fm: np.ndarray, bin_thres: float, bin_wnd: int) -> np.ndarray:
    return cv2.adaptiveThreshold(
        fm,
        1,
        cv2.ADAPTIVE_THRESH_MEAN_C,
        cv2.THRESH_BINARY,
        bin_wnd,
        -bin_thres,
    ).astype(bool)



[docs]
def apply_transform(
    varr: xr.DataArray, trans: xr.DataArray, fill: float = 0, mesh_size: tuple[int, int] = None
) -> xr.DataArray:
    """
    Apply necessary transform to correct for motion.

    This function can correct for both rigid and non-rigid motion depending on
    the number of dimensions of input `trans`.

    Parameters
    ----------
    varr : xr.DataArray
        Input array representing movie data.
    trans : xr.DataArray
        Estimated motion, if `trans.ndim > 2` then it is interpreted as shifts
        of control points of mesh grid, and BSpline transform will be
        constructed. Otherwise it is interpreted as shifts in each direction of
        rigid translation.
    fill : int, optional
        Values used to fill in missing pixels (outside field of view). By default
        `0`.
    mesh_size : tuple[int, int], optional
        `mesh_size` parameter used when estimating motion. Only used if
        `trans.ndim > 2`. If `None` and `trans.ndim > 2` then one will be
        computed using :func:`get_mesh_size`. By default `None`.

    Returns
    -------
    varr_sh : xr.DataArray
        Movie data after transform.
    """
    sh_dim = trans.coords["shift_dim"].values.tolist()
    if "grid0" in trans.dims:
        fm0 = varr.isel(frame=0).values
        if mesh_size is None:
            mesh_size = get_mesh_size(fm0)
        param = get_bspline_param(fm0, mesh_size)
        mdim = ["shift_dim", "grid0", "grid1"]
    else:
        param = None
        mdim = ["shift_dim"]
    varr_sh = xr.apply_ufunc(
        transform_perframe,
        varr.chunk(dict.fromkeys(sh_dim, -1)),
        trans,
        input_core_dims=[sh_dim, mdim],
        output_core_dims=[sh_dim],
        vectorize=True,
        dask="parallelized",
        kwargs={"fill": fill, "param": param},
        output_dtypes=[varr.dtype],
    )
    return varr_sh




[docs]
def transform_perframe(
    fm: np.ndarray,
    tx_coef: np.ndarray,
    fill: float = 0,
    param: np.ndarray | None = None,
    mesh_size: tuple[int, int] | None = None,
) -> np.ndarray:
    """
    Transform a single frame.

    Parameters
    ----------
    fm : np.ndarray
        Frame to be transformed.
    tx_coef : np.ndarray
        Coefficient of transformation. If `tx_coef.ndim > 1`, then it is
        interpreted as BSpline transform coefficients. Otherwise it is
        interpreted as rigid translations.
    fill : int, optional
        Values used to fill in missing pixels (outside field of view). By
        default `0`.
    param : np.ndarray, optional
        Fixed parameters defining the BSpline transform. Only used if
        `tx_coef.ndim > 1`. By default `None`.
    mesh_size : tuple[int, int], optional
        `mesh_size` parameter used to estimate motion. If `None` and
        `tx_coef.ndim > 1`, then one will be computed using
        :func:`get_mesh_size`. By default `None`.

    Returns
    -------
    fm : np.ndarray
        The frame after transform.
    """
    if tx_coef.ndim == 1:
        # Rigid translation via cv2.warpAffine (much faster than sitk.Resample
        # for a bilinear warp). `tx_coef` is (height, width): a positive shift
        # moves content toward +height/+width.
        warp = np.array([[1, 0, tx_coef[1]], [0, 1, tx_coef[0]]], dtype=np.float32)
        out = cv2.warpAffine(
            np.asarray(fm, dtype=np.float32),
            warp,
            (fm.shape[1], fm.shape[0]),
            flags=cv2.INTER_LINEAR,
            borderMode=cv2.BORDER_CONSTANT,
            borderValue=float(fill),
        )
        return out.astype(fm.dtype, copy=False)
    if param is None:
        if mesh_size is None:
            mesh_size = get_mesh_size(fm)
        param = get_bspline_param(fm, mesh_size)
    tx = sitk.BSplineTransform([sitk.GetImageFromArray(a) for a in tx_coef])
    tx.SetFixedParameters(param)
    fm = sitk.GetImageFromArray(fm)
    fm = sitk.Resample(fm, fm, tx, sitk.sitkLinear, fill)
    return sitk.GetArrayFromImage(fm)




[docs]
def get_bspline_param(img: np.ndarray, mesh_size: tuple[int, int]) -> np.ndarray:
    """
    Compute fixed parameters for the BSpline transform given a frame and mesh size.

    Parameters
    ----------
    img : np.ndarray
        Input frame.
    mesh_size : tuple[int, int]
        Number of control points for the BSpline mesh.

    Returns
    -------
    param : np.ndarray
        Fixed parameters of a BSpline transform.
    """
    return sitk.BSplineTransformInitializer(
        image1=sitk.GetImageFromArray(img), transformDomainMeshSize=mesh_size
    ).GetFixedParameters()




[docs]
def get_mesh_size(fm: np.ndarray) -> np.ndarray:
    """
    Compute suitable mesh size given a frame.

    The computed mesh size will result in approximately 100 pixels per
    patch/control point in each direction.

    Parameters
    ----------
    fm : np.ndarray
        The input frame.

    Returns
    -------
    mesh_size : np.ndarray
        The auto determined mesh size.
    """
    return (int(np.around(fm.shape[0] / 100)), int(np.around(fm.shape[1] / 100)))