Source code for pyflowreg.core.optical_flow

"""
Optical Flow Implementation
============================

This module implements the variational optical flow computation using
a pyramid-based multi-scale approach with gradient constancy assumption.

This is the default 'flowreg' backend implementation that maintains
compatibility with the MATLAB Flow-Registration toolbox.

Functions
---------
get_displacement
    Main API function for computing optical flow between two frames
get_motion_tensor_gc
    Compute motion tensor components for gradient constancy
get_motion_tensor_gray
    Compute motion tensor components for gray-value constancy
get_motion_tensor_cs
    Compute motion tensor components for census constancy
imregister_wrapper
    Warp an image using computed displacement fields
warpingDepth
    Calculate pyramid depth based on image dimensions
add_boundary
    Add boundary padding to arrays

Notes
-----
The implementation uses a coarse-to-fine pyramid scheme where flow is
computed at progressively finer resolutions, with each level initialized
from the previous coarser level.

See Also
--------
pyflowreg.core.level_solver.compute_flow : Low-level flow solver
"""

import cv2
import numpy as np
from scipy.ndimage import median_filter

from pyflowreg.core.level_solver import compute_flow, compute_flow_gnc
from pyflowreg.core.warping import imregister_wrapper, warpingDepth
from pyflowreg.util.resize_util import imresize_fused_gauss_cubic as resize



[docs]
def add_boundary(f):
    """
    Surround an array with a one-element ring of replicated edge values.

    Parameters
    ----------
    f : np.ndarray
        Array to pad. Every axis is padded.

    Returns
    -------
    padded : np.ndarray
        Copy of ``f`` whose size along each axis is larger by 2; the new
        outer elements repeat the nearest original edge element.

    Notes
    -----
    Edge replication makes the one-sided difference across the border zero,
    which is how the flow solver's Neumann (zero-derivative) boundary
    condition is realised.
    """
    padded = np.pad(f, pad_width=1, mode="edge")
    return padded




[docs]
def get_motion_tensor_gc(f1, f2, hy, hx):
    """
    Build the motion tensor for the gradient constancy assumption.

    The tensor linearises the constraint that the spatial image gradient is
    preserved between the two frames. Second-order spatial derivatives are
    averaged over both frames, while the temporal terms are derivatives of
    the frame difference ``f2 - f1``.

    Parameters
    ----------
    f1 : ndarray
        Reference frame (2D array).
    f2 : ndarray
        Moving frame (2D array).
    hy : float
        Grid spacing along rows (y-direction).
    hx : float
        Grid spacing along columns (x-direction).

    Returns
    -------
    J11, J22, J33, J12, J13, J23 : ndarray
        Motion tensor components, each one element larger than the input on
        every side. The outermost ring of every component is zero.

    Notes
    -----
    Both gradient-component constraints are normalised by the squared
    magnitude of their own spatial gradient (plus ``1e-6``), so strongly and
    weakly textured regions contribute on a comparable scale.

    The ``sqrt(...) ** 2`` in the normalisation is kept on purpose so that
    results stay bit-for-bit identical to the existing implementation.

    References
    ----------
    .. [2] Brox, T., Bruhn, A., Papenberg, N., and Weickert, J. "High
       Accuracy Optical Flow Estimation Based on a Theory for Warping",
       ECCV 2004.
    .. [3] Flotho, P., et al. "Software for Non-Parametric Image
       Registration of 2-Photon Imaging Data", J. Biophotonics, 2022.
    """

    def _second_differences(img, step_x, step_y):
        # Three-point second differences on the interior; the outermost
        # ring keeps the zeros it was initialised with. ``step_x`` scales
        # the column (x) stencil and ``step_y`` the row (y) stencil.
        d2x = np.zeros_like(img)
        d2y = np.zeros_like(img)
        d2x[1:-1, 1:-1] = (img[1:-1, 0:-2] - 2 * img[1:-1, 1:-1] + img[1:-1, 2:]) / (
            step_x**2
        )
        d2y[1:-1, 1:-1] = (img[0:-2, 1:-1] - 2 * img[1:-1, 1:-1] + img[2:, 1:-1]) / (
            step_y**2
        )
        return d2x, d2y

    def _remirror(field):
        # Discard the outer ring and mirror the core back out to full size.
        return np.pad(field[1:-1, 1:-1], 1, mode="symmetric")

    ring = ((1, 1), (1, 1))
    ref = np.pad(f1, ring, mode="symmetric")
    mov = np.pad(f2, ring, mode="symmetric")

    # np.gradient returns (d/drow, d/dcol); index 1 is the x-derivative.
    fx_ref = np.gradient(ref, hy, hx)[1]
    fx_mov = np.gradient(mov, hy, hx)[1]
    fx = _remirror(0.5 * (fx_ref + fx_mov))
    ft = _remirror(mov - ref)

    fxy = np.gradient(fx, hy, hx)[0]
    fyt, fxt = np.gradient(ft, hy, hx)

    fxx_ref, fyy_ref = _second_differences(ref, hx, hy)
    fxx_mov, fyy_mov = _second_differences(mov, hx, hy)
    fxx = 0.5 * (fxx_ref + fxx_mov)
    fyy = 0.5 * (fyy_ref + fyy_mov)

    reg_x = 1.0 / ((np.sqrt(fxx**2 + fxy**2) ** 2) + 1e-6)
    reg_y = 1.0 / ((np.sqrt(fxy**2 + fyy**2) ** 2) + 1e-6)

    # Order: J11, J22, J33, J12, J13, J23.
    tensor = (
        reg_x * fxx**2 + reg_y * fxy**2,
        reg_x * fxy**2 + reg_y * fyy**2,
        reg_x * fxt**2 + reg_y * fyt**2,
        reg_x * fxx * fxy + reg_y * fxy * fyy,
        reg_x * fxx * fxt + reg_y * fxy * fyt,
        reg_x * fxy * fxt + reg_y * fyy * fyt,
    )
    for component in tensor:
        component[:, [0, -1]] = 0
        component[[0, -1], :] = 0
    return tensor




[docs]
def get_motion_tensor_gray(f1, f2, hy, hx):
    """
    Build the motion tensor for the gray-value (brightness) constancy
    assumption.

    The tensor is the outer product of ``(fx, fy, ft)`` with itself, where
    ``fx`` and ``fy`` are first-order spatial derivatives averaged over both
    frames and ``ft`` is the frame difference ``f2 - f1``.

    Parameters
    ----------
    f1 : ndarray
        Reference frame (2D array).
    f2 : ndarray
        Moving frame (2D array).
    hy : float
        Grid spacing along rows (y-direction).
    hx : float
        Grid spacing along columns (x-direction).

    Returns
    -------
    J11, J22, J33, J12, J13, J23 : ndarray
        Motion tensor components, each one element larger than the input on
        every side. The outermost ring of every component is zero.

    Notes
    -----
    Derivatives are taken on symmetrically padded frames. The derivative
    fields are then cropped back to the image core and mirrored outwards
    again before the products are formed.
    """

    def _remirror(field):
        # Discard the outer ring and mirror the core back out to full size.
        return np.pad(field[1:-1, 1:-1], 1, mode="symmetric")

    ring = ((1, 1), (1, 1))
    ref = np.pad(f1, ring, mode="symmetric")
    mov = np.pad(f2, ring, mode="symmetric")

    # np.gradient returns (d/drow, d/dcol), i.e. (fy, fx).
    grad_ref = np.gradient(ref, hy, hx)
    grad_mov = np.gradient(mov, hy, hx)

    fx = _remirror(0.5 * (grad_ref[1] + grad_mov[1]))
    fy = _remirror(0.5 * (grad_ref[0] + grad_mov[0]))
    ft = _remirror(mov - ref)

    # Order: J11, J22, J33, J12, J13, J23.
    tensor = (fx * fx, fy * fy, ft * ft, fx * fy, fx * ft, fy * ft)
    for component in tensor:
        component[:, [0, -1]] = 0
        component[[0, -1], :] = 0
    return tensor




[docs]
def get_motion_tensor_cs(f1, f2, hy, hx, eps=None):
    """
    Build the motion tensor for a smoothed census constancy assumption.

    For each of the eight neighbours in a 3x3 window, the directional
    difference ``r = (neighbour - centre) / dist`` is passed through a
    smoothed Heaviside function. The resulting signature image is treated
    like a brightness-constancy channel: its averaged spatial derivatives
    and its inter-frame difference are multiplied pairwise and accumulated
    over all eight directions.

    Parameters
    ----------
    f1 : ndarray
        Reference frame (2D array).
    f2 : ndarray
        Moving frame (2D array).
    hy : float
        Grid spacing along rows (y-direction).
    hx : float
        Grid spacing along columns (x-direction).
    eps : float, optional
        Smoothing width of the smoothed Heaviside function. If None,
        ``0.1 / 255.0`` is used, matching the Hafner/Demetz/Weickert
        ``epsilon = 0.1`` convention for images scaled from ``[0, 255]`` to
        approximately ``[0, 1]``. Because ``r`` is divided by a distance
        built from ``hx`` and ``hy``, callers using physical units may need
        to scale ``eps`` accordingly.

    Returns
    -------
    J11, J22, J33, J12, J13, J23 : ndarray
        Float64 motion tensor components, each one element larger than the
        input on every side. The accumulated sums are multiplied by
        ``2 / 8`` and the outermost ring of every component is zero.

    Notes
    -----
    A hard census transform depends only on the ordering of grey values and
    is therefore invariant under monotonically increasing grey-value
    transforms. Here the comparison is smoothed and linearised, so that
    invariance only holds approximately. Additive offsets still cancel
    exactly in the neighbour-minus-centre differences. Multiplicative
    changes are handled well only when ``eps`` is small relative to the
    directional differences.

    References
    ----------
    .. [1] Hafner, D., Demetz, O., and Weickert, J. "Why is the Census
       Transform Good for Robust Optic Flow Computation?", SSVM 2013.
    """
    eps = 0.1 / 255.0 if eps is None else eps
    eps_sq = eps * eps

    def _soft_step(r):
        # Smoothed Heaviside: 0.5 at r == 0, tending to 0 / 1 for |r| >> eps.
        return 0.5 * (1.0 + r / np.sqrt(r * r + eps_sq))

    n_rows, n_cols = f1.shape
    ring = ((1, 1), (1, 1))
    ref = np.pad(f1, ring, mode="symmetric")
    mov = np.pad(f2, ring, mode="symmetric")
    ref_center = ref[1:-1, 1:-1]
    mov_center = mov[1:-1, 1:-1]

    # Eight-connected neighbourhood, row offset varying slowest.
    shifts = [
        (dy, dx) for dy in (-1, 0, 1) for dx in (-1, 0, 1) if (dy, dx) != (0, 0)
    ]
    norm = 2.0 / float(len(shifts))

    # Accumulators in the order J11, J22, J33, J12, J13, J23.
    totals = tuple(np.zeros_like(ref, dtype=np.float64) for _ in range(6))

    for dy, dx in shifts:
        step = float(np.sqrt((hy * dy) * (hy * dy) + (hx * dx) * (hx * dx)))
        window = (
            slice(1 + dy, 1 + dy + n_rows),
            slice(1 + dx, 1 + dx + n_cols),
        )

        sig_ref = np.pad(_soft_step((ref[window] - ref_center) / step), 1, mode="edge")
        sig_mov = np.pad(_soft_step((mov[window] - mov_center) / step), 1, mode="edge")

        gy_ref, gx_ref = np.gradient(sig_ref, hy, hx)
        gy_mov, gx_mov = np.gradient(sig_mov, hy, hx)
        sx = 0.5 * (gx_ref + gx_mov)
        sy = 0.5 * (gy_ref + gy_mov)
        st = sig_mov - sig_ref

        products = (sx * sx, sy * sy, st * st, sx * sy, sx * st, sy * st)
        for total, product in zip(totals, products):
            total += product  # in-place: updates the accumulator array

    for total in totals:
        total *= norm
        total[:, [0, -1]] = 0
        total[[0, -1], :] = 0

    return totals




[docs]
def level_solver(
    J11,
    J22,
    J33,
    J12,
    J13,
    J23,
    weight,
    u,
    v,
    alpha,
    iterations,
    update_lag,
    verbose,
    a_data,
    a_smooth,
    hx,
    hy,
    gnc_beta=None,
):
    """
    Solve for the flow increment on one pyramid level.

    Dispatches to ``compute_flow`` when ``gnc_beta`` is None and to
    ``compute_flow_gnc`` (which additionally receives ``gnc_beta``)
    otherwise. All other arguments are forwarded unchanged, except that
    ``alpha`` is split into ``alpha_x = alpha[0]`` and ``alpha_y = alpha[1]``.

    Parameters
    ----------
    J11, J22, J33, J12, J13, J23 : ndarray
        Motion tensor components for this level.
    weight : ndarray
        Data-term weights for this level.
    u, v : ndarray
        Current flow estimate for this level.
    alpha : sequence of float
        Smoothness weights; entries 0 and 1 are used.
    iterations : int
        Forwarded to the solver as ``iterations``.
    update_lag : int
        Forwarded to the solver as ``update_lag``.
    verbose : object
        Accepted for signature compatibility; not forwarded to the solver.
    a_data, a_smooth
        Forwarded to the solver under the same names.
    hx, hy : float
        Grid spacings, forwarded to the solver under the same names.
    gnc_beta : float, optional
        Selects the GNC solver when not None.

    Returns
    -------
    du, dv : ndarray
        Slices ``[:, :, 0]`` and ``[:, :, 1]`` of the solver result.
    """
    tensor = (J11, J22, J33, J12, J13, J23)
    shared = dict(
        weight=weight,
        u=u,
        v=v,
        alpha_x=alpha[0],
        alpha_y=alpha[1],
        iterations=iterations,
        update_lag=update_lag,
        a_data=a_data,
        a_smooth=a_smooth,
        hx=hx,
        hy=hy,
    )
    if gnc_beta is not None:
        flow = compute_flow_gnc(*tensor, **shared, gnc_beta=gnc_beta)
    else:
        flow = compute_flow(*tensor, **shared)
    return flow[:, :, 0], flow[:, :, 1]




[docs]
def normalize_gnc_schedule(gnc_schedule):
    """
    Validate and normalize an optional GNC schedule.

    Parameters
    ----------
    gnc_schedule : sequence of float or None
        Stage weights. None means GNC is disabled.

    Returns
    -------
    np.ndarray or None
        None when ``gnc_schedule`` is None; otherwise a C-contiguous 1-D
        float64 array holding the schedule.

    Raises
    ------
    ValueError
        If the schedule is not one-dimensional, has fewer than two entries,
        has entries outside ``[0, 1]``, decreases anywhere, does not start
        at (approximately) 0.0, or does not end at (approximately) 1.0.
    """
    if gnc_schedule is None:
        return None

    stages = np.asarray(gnc_schedule, dtype=np.float64)

    # The checks run lazily and in this order: later predicates index into
    # the array and are only meaningful once the shape checks have passed.
    checks = (
        (
            lambda s: s.ndim != 1,
            "gnc_schedule must be a 1D sequence of stage weights",
        ),
        (
            lambda s: s.size < 2,
            "gnc_schedule must contain at least two stages",
        ),
        (
            lambda s: bool(((s < 0.0) | (s > 1.0)).any()),
            "gnc_schedule entries must lie in [0, 1]",
        ),
        (
            lambda s: not np.all(np.diff(s) >= 0.0),
            "gnc_schedule must be monotone nondecreasing",
        ),
        (
            lambda s: not np.isclose(s[0], 0.0),
            "gnc_schedule must start at 0.0",
        ),
        (
            lambda s: not np.isclose(s[-1], 1.0),
            "gnc_schedule must end at 1.0",
        ),
    )
    for is_violated, message in checks:
        if is_violated(stages):
            raise ValueError(message)

    return np.ascontiguousarray(stages)




[docs]
def normalize_warping_steps(warping_steps):
    """
    Validate and normalize an optional number of warping steps.

    Parameters
    ----------
    warping_steps : int-convertible or None
        Requested number of steps. None is passed through unchanged.

    Returns
    -------
    int or None
        ``int(warping_steps)``, or None when the input is None.

    Raises
    ------
    ValueError
        If the converted value is smaller than 1.
    """
    if warping_steps is not None:
        count = int(warping_steps)
        if count >= 1:
            return count
        raise ValueError("warping_steps must be a positive integer")
    return None



def _resolve_motion_tensor_func(const_assumption):
    """
    Map a constancy-assumption selector to its motion tensor function.

    The selector may be a string or any object exposing a ``value``
    attribute (for example an enum member). It is compared
    case-insensitively after stripping surrounding whitespace.

    ``gc`` / ``gradient`` is the MATLAB Flow-Registration behavior;
    ``gray`` / ``brightness`` and ``cs`` / ``census`` are explicit opt-in
    alternatives.

    Raises
    ------
    ValueError
        If the selector matches none of the supported names.
    """
    const_assumption = getattr(const_assumption, "value", const_assumption)

    alias_groups = (
        (("gc", "gradient"), get_motion_tensor_gc),
        (("gray", "brightness"), get_motion_tensor_gray),
        (("cs", "census"), get_motion_tensor_cs),
    )
    lookup = {alias: func for aliases, func in alias_groups for alias in aliases}

    normalized = str(const_assumption).strip().lower()
    try:
        selected = lookup[normalized]
    except KeyError as e:
        supported = "', '".join(sorted(lookup))
        raise ValueError(
            f"Unknown constancy assumption: '{const_assumption}'. "
            f"Supported values are: '{supported}'."
        ) from e
    return selected


def _solve_displacement_stage(
    fixed,
    moving,
    alpha,
    update_lag,
    iterations,
    min_level,
    levels,
    eta,
    a_smooth,
    a_data_arr,
    uv,
    weight,
    level_solver_backend,
    motion_tensor_func,
    gnc_beta,
):
    """Solve one full pyramid pass for a fixed GNC stage.

    Runs a coarse-to-fine loop with exactly one warp / linearize / solve
    step per pyramid level. At each level the flow from the coarser level is
    resized, the moving image is warped with it, the motion tensor is built
    per channel, and the level solver returns an increment that is
    median-filtered and added to the flow.

    Parameters
    ----------
    fixed, moving : np.ndarray
        Reference and moving images, both indexed as (rows, cols, channels).
    alpha : sequence of float
        Smoothness weights; every entry is multiplied by a per-level factor
        before being handed to the solver.
    update_lag, iterations, a_smooth, a_data_arr
        Forwarded unchanged to the level solver.
    min_level : int
        Finest pyramid level to solve. It is lowered if it is not below the
        coarsest level and clamped to be non-negative.
    levels : int
        Passed to ``warpingDepth`` when determining the pyramid depth.
    eta : float
        Per-level size factor; level ``i`` has roughly ``eta ** i`` times the
        full-resolution size along each axis.
    uv : np.ndarray or None
        Optional initial flow; ``uv[:, :, 0]`` is u and ``uv[:, :, 1]`` is v.
        Zeros are used when None.
    weight : np.ndarray
        Data-term weights, resized to every level.
    level_solver_backend : callable or None
        Replacement for ``level_solver``; called with the same positional
        arguments.
    motion_tensor_func : callable
        Called as ``motion_tensor_func(f1_channel, f2_channel, h_row, h_col)``
        and expected to return the six tensor components.
    gnc_beta : float or None
        Forwarded as the last positional argument to the level solver.

    Returns
    -------
    w : np.ndarray
        Flow field with ``w[:, :, 0] = u`` and ``w[:, :, 1] = v``. When
        ``min_level > 0`` it is resized to ``(m, n)`` with cubic
        interpolation.

    Notes
    -----
    At the coarsest level the moving image is used unwarped (``tmp`` is a
    plain copy of ``f2_level``), even when ``uv`` supplies a non-zero
    initial flow; the initial flow still enters the solver through ``u`` and
    ``v``.
    """
    m, n, n_channels = fixed.shape
    f1_low = fixed
    f2_low = moving
    # Pyramid depth per axis; the deeper axis is capped at four times the
    # depth of the shallower one.
    max_level_y = warpingDepth(eta, levels, m, m)
    max_level_x = warpingDepth(eta, levels, n, n)
    max_level = min(max_level_x, max_level_y) * 4
    max_level_y = min(max_level_y, max_level)
    max_level_x = min(max_level_x, max_level)
    # Keep the finest level strictly below the coarsest one where possible,
    # and never negative.
    if max(max_level_x, max_level_y) <= min_level:
        min_level = max(max_level_x, max_level_y) - 1
    if min_level < 0:
        min_level = 0
    if uv is not None:
        u_init = uv[:, :, 0]
        v_init = uv[:, :, 1]
    else:
        u_init = np.zeros((m, n), dtype=np.float64)
        v_init = np.zeros((m, n), dtype=np.float64)
    u = None
    v = None
    # Coarse-to-fine: i counts down from the coarsest level to min_level.
    for i in range(max(max_level_x, max_level_y), min_level - 1, -1):
        # Each axis stops shrinking once its own maximum depth is reached.
        level_size = (
            int(round(m * eta ** (min(i, max_level_y)))),
            int(round(n * eta ** (min(i, max_level_x)))),
        )
        f1_level = resize(f1_low, level_size)
        f2_level = resize(f2_low, level_size)
        # Restore the channel axis if resize returned a 2-D array.
        if f1_level.ndim == 2:
            f1_level = f1_level[:, :, np.newaxis]
            f2_level = f2_level[:, :, np.newaxis]
        # Grid spacings of this pyramid level in full-resolution pixel units:
        # h_row scales row (y) differences, h_col scales column (x)
        # differences. u is the horizontal (column) and v the vertical (row)
        # displacement, both in full-resolution pixel units.
        h_row = float(m) / f1_level.shape[0]
        h_col = float(n) / f1_level.shape[1]
        if i == max(max_level_x, max_level_y):
            # Coarsest level: start from the (resized) initial flow and use
            # the moving image unwarped.
            u = add_boundary(resize(u_init, level_size))
            v = add_boundary(resize(v_init, level_size))
            tmp = f2_level.copy()
        else:
            # Finer level: resize the previous flow (without its boundary
            # ring) and warp the moving image with it. The flow is divided
            # by the grid spacing to express it in pixels of this level.
            u = add_boundary(resize(u[1:-1, 1:-1], level_size))
            v = add_boundary(resize(v[1:-1, 1:-1], level_size))
            tmp = imregister_wrapper(
                f2_level,
                u[1:-1, 1:-1] / h_col,
                v[1:-1, 1:-1] / h_row,
                f1_level,
            )
        if tmp.ndim == 2:
            tmp = tmp[:, :, np.newaxis]
        u = np.ascontiguousarray(u)
        v = np.ascontiguousarray(v)
        # Tensor components carry a one-element boundary ring, like u and v.
        J_size = (f1_level.shape[0] + 2, f1_level.shape[1] + 2, n_channels)
        J11 = np.zeros(J_size, dtype=np.float64)
        J22 = np.zeros(J_size, dtype=np.float64)
        J33 = np.zeros(J_size, dtype=np.float64)
        J12 = np.zeros(J_size, dtype=np.float64)
        J13 = np.zeros(J_size, dtype=np.float64)
        J23 = np.zeros(J_size, dtype=np.float64)
        for ch in range(n_channels):
            J11_ch, J22_ch, J33_ch, J12_ch, J13_ch, J23_ch = motion_tensor_func(
                f1_level[:, :, ch], tmp[:, :, ch], h_row, h_col
            )
            J11[:, :, ch] = J11_ch
            J22[:, :, ch] = J22_ch
            J33[:, :, ch] = J33_ch
            J12[:, :, ch] = J12_ch
            J13[:, :, ch] = J13_ch
            J23[:, :, ch] = J23_ch

        # Weights get a zero boundary ring so the border carries no data term.
        weight_level = resize(weight, f1_level.shape[:2])
        weight_level = cv2.copyMakeBorder(
            weight_level, 1, 1, 1, 1, borderType=cv2.BORDER_CONSTANT, value=0.0
        )
        if weight_level.ndim < 3:
            weight_level = weight_level[:, :, np.newaxis]

        # Smoothness weight is scaled up on coarser levels; the finest
        # solved level uses alpha unscaled.
        if i == min_level:
            alpha_scaling = 1
        else:
            alpha_scaling = eta ** (-0.5 * i)

        alpha_tmp = [alpha_scaling * alpha[j] for j in range(len(alpha))]

        # Use custom level solver if provided, otherwise use default
        solver_func = (
            level_solver_backend if level_solver_backend is not None else level_solver
        )

        du, dv = solver_func(
            np.ascontiguousarray(J11),
            np.ascontiguousarray(J22),
            np.ascontiguousarray(J33),
            np.ascontiguousarray(J12),
            np.ascontiguousarray(J13),
            np.ascontiguousarray(J23),
            np.ascontiguousarray(weight_level),
            u,
            v,
            alpha_tmp,
            iterations,
            update_lag,
            0,  # fills the `verbose` slot of the level_solver signature
            a_data_arr,
            a_smooth,
            # The solver's hx scales column (x) differences and hy scales row
            # (y) differences; passing (h_row, h_col) here would swap the
            # smoothness metric relative to the data term and warping above.
            h_col,
            h_row,
            gnc_beta,
        )
        # Median-filter the increment (interior only) on levels larger than
        # the 5x5 filter window.
        if min(level_size) > 5:
            du[1:-1, 1:-1] = median_filter(du[1:-1, 1:-1], size=(5, 5), mode="mirror")
            dv[1:-1, 1:-1] = median_filter(dv[1:-1, 1:-1], size=(5, 5), mode="mirror")
        u = u + du
        v = v + dv
    # Strip the boundary ring and stack (u, v) along the last axis.
    w = np.zeros((u.shape[0] - 2, u.shape[1] - 2, 2), dtype=np.float64)
    w[:, :, 0] = u[1:-1, 1:-1]
    w[:, :, 1] = v[1:-1, 1:-1]
    # If the finest solved level is not full resolution, upsample the flow.
    # cv2.resize takes its target size as (width, height).
    if min_level > 0:
        w = cv2.resize(w, (n, m), interpolation=cv2.INTER_CUBIC)
    return w


def _solve_displacement_stage_gnc(
    fixed,
    moving,
    alpha,
    update_lag,
    iterations,
    min_level,
    levels,
    eta,
    a_smooth,
    a_data_arr,
    uv,
    weight,
    level_solver_backend,
    motion_tensor_func,
    gnc_beta,
    warping_steps,
):
    """Solve one GNC stage with repeated warp/relinearize steps per level.

    Runs a coarse-to-fine loop. On every pyramid level, including the
    coarsest, the moving image is warped with the current flow, the motion
    tensor is rebuilt per channel and the level solver is called;
    this is repeated ``warping_steps`` times before moving to the next finer
    level.

    Parameters
    ----------
    fixed, moving : np.ndarray
        Reference and moving images, both indexed as (rows, cols, channels).
    alpha : sequence of float
        Smoothness weights; every entry is multiplied by a per-level factor
        before being handed to the solver.
    update_lag, iterations, a_smooth, a_data_arr
        Forwarded unchanged to the level solver.
    min_level : int
        Finest pyramid level to solve. It is lowered if it is not below the
        coarsest level and clamped to be non-negative.
    levels : int
        Passed to ``warpingDepth`` when determining the pyramid depth.
    eta : float
        Per-level size factor; level ``i`` has roughly ``eta ** i`` times the
        full-resolution size along each axis.
    uv : np.ndarray or None
        Optional initial flow; ``uv[:, :, 0]`` is u and ``uv[:, :, 1]`` is v.
        Zeros are used when None.
    weight : np.ndarray
        Data-term weights, resized to every level.
    level_solver_backend : callable or None
        Replacement for ``level_solver``; called with the same positional
        arguments.
    motion_tensor_func : callable
        Called as ``motion_tensor_func(f1_channel, f2_channel, h_row, h_col)``
        and expected to return the six tensor components.
    gnc_beta : float
        Forwarded as the last positional argument to the level solver.
    warping_steps : int
        Number of warp / relinearize / solve repetitions per pyramid level.

    Returns
    -------
    w : np.ndarray
        Flow field with ``w[:, :, 0] = u`` and ``w[:, :, 1] = v``. When
        ``min_level > 0`` it is resized to ``(m, n)`` with cubic
        interpolation.

    Notes
    -----
    After each step the median filter is applied to the full updated flow
    (not just the increment), and the boundary ring is rebuilt with
    ``add_boundary``.
    """
    m, n, n_channels = fixed.shape
    f1_low = fixed
    f2_low = moving
    # Pyramid depth per axis; the deeper axis is capped at four times the
    # depth of the shallower one.
    max_level_y = warpingDepth(eta, levels, m, m)
    max_level_x = warpingDepth(eta, levels, n, n)
    max_level = min(max_level_x, max_level_y) * 4
    max_level_y = min(max_level_y, max_level)
    max_level_x = min(max_level_x, max_level)
    # Keep the finest level strictly below the coarsest one where possible,
    # and never negative.
    if max(max_level_x, max_level_y) <= min_level:
        min_level = max(max_level_x, max_level_y) - 1
    if min_level < 0:
        min_level = 0
    if uv is not None:
        u_init = uv[:, :, 0]
        v_init = uv[:, :, 1]
    else:
        u_init = np.zeros((m, n), dtype=np.float64)
        v_init = np.zeros((m, n), dtype=np.float64)

    # Use the custom level solver if one was provided, else the default.
    solver_func = (
        level_solver_backend if level_solver_backend is not None else level_solver
    )
    u = None
    v = None
    # Coarse-to-fine: i counts down from the coarsest level to min_level.
    for i in range(max(max_level_x, max_level_y), min_level - 1, -1):
        # Each axis stops shrinking once its own maximum depth is reached.
        level_size = (
            int(round(m * eta ** (min(i, max_level_y)))),
            int(round(n * eta ** (min(i, max_level_x)))),
        )
        f1_level = resize(f1_low, level_size)
        f2_level = resize(f2_low, level_size)
        # Restore the channel axis if resize returned a 2-D array.
        if f1_level.ndim == 2:
            f1_level = f1_level[:, :, np.newaxis]
            f2_level = f2_level[:, :, np.newaxis]
        # Grid spacings of this pyramid level in full-resolution pixel units:
        # h_row scales row (y) differences, h_col scales column (x)
        # differences. u is the horizontal (column) and v the vertical (row)
        # displacement, both in full-resolution pixel units.
        h_row = float(m) / f1_level.shape[0]
        h_col = float(n) / f1_level.shape[1]

        # Initialise this level's flow from the initial guess (coarsest
        # level) or from the previous level's result without its boundary.
        if i == max(max_level_x, max_level_y):
            u = add_boundary(resize(u_init, level_size))
            v = add_boundary(resize(v_init, level_size))
        else:
            u = add_boundary(resize(u[1:-1, 1:-1], level_size))
            v = add_boundary(resize(v[1:-1, 1:-1], level_size))

        u = np.ascontiguousarray(u)
        v = np.ascontiguousarray(v)

        # Weights get a zero boundary ring so the border carries no data term.
        weight_level = resize(weight, f1_level.shape[:2])
        weight_level = cv2.copyMakeBorder(
            weight_level, 1, 1, 1, 1, borderType=cv2.BORDER_CONSTANT, value=0.0
        )
        if weight_level.ndim < 3:
            weight_level = weight_level[:, :, np.newaxis]
        weight_level = np.ascontiguousarray(weight_level)

        # Smoothness weight is scaled up on coarser levels; the finest
        # solved level uses alpha unscaled.
        if i == min_level:
            alpha_scaling = 1
        else:
            alpha_scaling = eta ** (-0.5 * i)
        alpha_tmp = [alpha_scaling * alpha[j] for j in range(len(alpha))]

        for _ in range(warping_steps):
            # Warp the moving image with the current flow, converted to
            # pixels of this level by dividing by the grid spacing.
            tmp = imregister_wrapper(
                f2_level,
                u[1:-1, 1:-1] / h_col,
                v[1:-1, 1:-1] / h_row,
                f1_level,
            )
            if tmp.ndim == 2:
                tmp = tmp[:, :, np.newaxis]

            # Relinearise: rebuild the motion tensor around the warped image.
            J_size = (f1_level.shape[0] + 2, f1_level.shape[1] + 2, n_channels)
            J11 = np.zeros(J_size, dtype=np.float64)
            J22 = np.zeros(J_size, dtype=np.float64)
            J33 = np.zeros(J_size, dtype=np.float64)
            J12 = np.zeros(J_size, dtype=np.float64)
            J13 = np.zeros(J_size, dtype=np.float64)
            J23 = np.zeros(J_size, dtype=np.float64)
            for ch in range(n_channels):
                J11_ch, J22_ch, J33_ch, J12_ch, J13_ch, J23_ch = motion_tensor_func(
                    f1_level[:, :, ch], tmp[:, :, ch], h_row, h_col
                )
                J11[:, :, ch] = J11_ch
                J22[:, :, ch] = J22_ch
                J33[:, :, ch] = J33_ch
                J12[:, :, ch] = J12_ch
                J13[:, :, ch] = J13_ch
                J23[:, :, ch] = J23_ch

            du, dv = solver_func(
                np.ascontiguousarray(J11),
                np.ascontiguousarray(J22),
                np.ascontiguousarray(J33),
                np.ascontiguousarray(J12),
                np.ascontiguousarray(J13),
                np.ascontiguousarray(J23),
                weight_level,
                u,
                v,
                alpha_tmp,
                iterations,
                update_lag,
                0,  # fills the `verbose` slot of the level_solver signature
                a_data_arr,
                a_smooth,
                # The solver's hx scales column (x) differences and hy scales
                # row (y) differences; passing (h_row, h_col) here would swap
                # the smoothness metric relative to the data term and warping.
                h_col,
                h_row,
                gnc_beta,
            )
            u = u + du
            v = v + dv
            # Median-filter the full updated flow (interior only) on levels
            # larger than the 5x5 window, then rebuild the boundary ring.
            if min(level_size) > 5:
                u = add_boundary(
                    median_filter(u[1:-1, 1:-1], size=(5, 5), mode="mirror")
                )
                v = add_boundary(
                    median_filter(v[1:-1, 1:-1], size=(5, 5), mode="mirror")
                )

    # Strip the boundary ring and stack (u, v) along the last axis.
    w = np.zeros((u.shape[0] - 2, u.shape[1] - 2, 2), dtype=np.float64)
    w[:, :, 0] = u[1:-1, 1:-1]
    w[:, :, 1] = v[1:-1, 1:-1]
    # If the finest solved level is not full resolution, upsample the flow.
    # cv2.resize takes its target size as (width, height).
    if min_level > 0:
        w = cv2.resize(w, (n, m), interpolation=cv2.INTER_CUBIC)
    return w



[docs]
def get_displacement(
    fixed,
    moving,
    alpha=(2, 2),
    update_lag=5,
    iterations=50,
    min_level=0,
    levels=50,
    eta=0.8,
    a_smooth=1.0,
    a_data=0.45,
    const_assumption="gc",
    uv=None,
    weight=None,
    level_solver_backend=None,
    gnc_schedule=None,
    warping_steps=None,
):
    """
    Compute optical flow displacement field using variational approach.

    This function implements the main pyramid-based variational optical flow
    algorithm. The data term is built from a selectable constancy assumption
    (gradient constancy by default). Flow is computed from coarse to fine
    scales, with each level initialized from the resized result of the
    previous coarser level.

    Parameters
    ----------
    fixed : np.ndarray
        Reference (fixed) image, shape (H, W) or (H, W, C)
    moving : np.ndarray
        Moving image to register, shape (H, W) or (H, W, C)
    alpha : tuple of float, default=(2, 2)
        Regularization strength (alpha_x, alpha_y) controlling smoothness.
        Larger values enforce smoother flow fields.
    update_lag : int, default=5
        Number of iterations between updates of non-linearity weights (psi).
        Smaller values update more frequently (slower, potentially more accurate).
        Larger values update less frequently (faster convergence).
    iterations : int, default=50
        Number of SOR iterations per pyramid level
    min_level : int, default=0
        Minimum (finest) pyramid level to compute. 0 = full resolution.
    levels : int, default=50
        Maximum number of pyramid levels attempted
    eta : float, default=0.8
        Pyramid downsampling factor per level (0 < eta <= 1).
        Each level is eta times the size of the previous level.
    a_smooth : float, default=1.0
        Exponent for generalized Charbonnier penalty on smoothness term.
    a_data : float or np.ndarray, default=0.45
        Exponent for generalized Charbonnier penalty on data term. A scalar
        is replicated for every channel; an ndarray is used as given.
    const_assumption : str, default='gc'
        Constancy assumption. Supported values are 'gc'/'gradient',
        'gray'/'brightness', and 'cs'/'census'.
    uv : np.ndarray, optional
        Initial displacement field (H, W, 2) with [u, v] components.
    weight : np.ndarray or list, optional
        Data-term weights. If omitted, every channel gets ``1 / C``.
        A 1-D sequence is interpreted as per-channel weights: it is padded
        with ``1 / C`` or truncated to ``C`` entries, normalized to sum to
        one, and broadcast over the image. A 2-D (H, W) map is broadcast
        over the channels. A 3-D array is used as given.
    level_solver_backend : Callable, optional
        Custom level solver function to use instead of the default CPU solver.
    gnc_schedule : sequence of float, optional
        Opt-in stage weights interpolating from quadratic (0.0) to fully robust
        (1.0). Each stage reruns the pyramid with the previous stage result used
        as initialization.
    warping_steps : int, optional
        Number of warp/relinearize steps per pyramid level in optional GNC mode.
        If omitted, GNC defaults to 10 steps per level. Ignored when GNC is off.

    Returns
    -------
    w : np.ndarray
        Displacement field with ``w[:, :, 0] = u`` and ``w[:, :, 1] = v``.

    Raises
    ------
    AssertionError
        If ``fixed`` and ``moving`` differ in their number of dimensions.
    ValueError
        If ``const_assumption`` is unknown, or if ``gnc_schedule`` or
        ``warping_steps`` fail validation.
    """
    assert (
        fixed.ndim == moving.ndim
    ), f"Fixed and moving must have same dimensions: fixed.shape={fixed.shape}, moving.shape={moving.shape}"
    motion_tensor_func = _resolve_motion_tensor_func(const_assumption)
    fixed = fixed.astype(np.float64)
    moving = moving.astype(np.float64)
    if fixed.ndim == 3:
        m, n, n_channels = fixed.shape
    else:
        # Promote single-channel input to (H, W, 1) so that the pyramid
        # code can always index a channel axis.
        m, n = fixed.shape
        n_channels = 1
        fixed = fixed[:, :, np.newaxis]
        moving = moving[:, :, np.newaxis]

    if weight is None:
        weight = np.ones((m, n, n_channels), dtype=np.float64) / n_channels
    else:
        # np.array (rather than .astype) so that plain lists and tuples are
        # accepted as documented; like .astype it always returns a copy.
        weight = np.array(weight, dtype=np.float64)
        if weight.ndim < 3:
            if weight.ndim == 1:
                # Per-channel weights: pad or truncate to n_channels entries.
                if len(weight) < n_channels:
                    default_weight = 1.0 / n_channels
                    weight_expanded = np.full(
                        n_channels, default_weight, dtype=np.float64
                    )
                    weight_expanded[: len(weight)] = weight
                    weight = weight_expanded
                elif len(weight) > n_channels:
                    weight = weight[:n_channels]
                weight = weight / weight.sum()
                weight = np.ones((m, n, n_channels), dtype=np.float64) * weight.reshape(
                    1, 1, -1
                )
            else:
                # Spatial weight map: replicate it for every channel.
                weight = (
                    np.ones((m, n, n_channels), dtype=np.float64)
                    * weight[..., np.newaxis]
                )

    if not isinstance(a_data, np.ndarray):
        a_data_arr = np.full(n_channels, a_data, dtype=np.float64)
    else:
        a_data_arr = a_data
    a_data_arr = np.ascontiguousarray(a_data_arr)

    gnc_schedule_arr = normalize_gnc_schedule(gnc_schedule)
    warping_steps = normalize_warping_steps(warping_steps)
    if gnc_schedule_arr is None:
        # Default path: a single pyramid pass with one warp per level.
        return _solve_displacement_stage(
            fixed,
            moving,
            alpha,
            update_lag,
            iterations,
            min_level,
            levels,
            eta,
            a_smooth,
            a_data_arr,
            uv,
            weight,
            level_solver_backend,
            motion_tensor_func,
            None,
        )

    # GNC path: one full pyramid pass per schedule entry, each pass being
    # initialized with the flow of the previous one.
    flow = uv
    effective_warping_steps = 10 if warping_steps is None else warping_steps
    for gnc_beta in gnc_schedule_arr:
        flow = _solve_displacement_stage_gnc(
            fixed,
            moving,
            alpha,
            update_lag,
            iterations,
            min_level,
            levels,
            eta,
            a_smooth,
            a_data_arr,
            flow,
            weight,
            level_solver_backend,
            motion_tensor_func,
            float(gnc_beta),
            effective_warping_steps,
        )
    return flow