unit tests added with updates for JAX and correct functionality

Jammy2211 · Jammy2211 · commit ac9805b528fc · 2026-02-13T11:03:25.000Z
diff --git a/autoarray/inversion/regularization/__init__.py b/autoarray/inversion/regularization/__init__.py
@@ -10,3 +10,4 @@
 from .gaussian_kernel import GaussianKernel
 from .exponential_kernel import ExponentialKernel
 from .matern_kernel import MaternKernel
+from .matern_adaptive_brightness_kernel import MaternAdaptiveBrightnessKernel
diff --git a/autoarray/inversion/regularization/matern_adaptive_brightness_kernel.py b/autoarray/inversion/regularization/matern_adaptive_brightness_kernel.py
@@ -1,52 +1,148 @@
-from autoarray.inversion.regularization.abstract import AbstractRegularization
+from __future__ import annotations
+import numpy as np
+from typing import TYPE_CHECKING
 
-from autoarray.inversion.regularization.matern_kernel import matern_cov_matrix_from
+from autoarray.inversion.regularization.matern_kernel import MaternKernel
 
+if TYPE_CHECKING:
+    from autoarray.inversion.linear_obj.linear_obj import LinearObj
 
-class AdaptiveBrightnessMatern(AbstractRegularization):
+from autoarray.inversion.regularization.matern_kernel import matern_kernel
+
+def matern_cov_matrix_from(
+    scale: float,
+    nu: float,
+    pixel_points,
+    weights=None,
+    xp=np,
+):
+    """
+    Construct the regularization covariance matrix (N x N) using a Matérn kernel,
+    optionally modulated by per-pixel weights.
+
+    If `weights` is provided (shape [N]), the covariance is:
+        C_ij = K(d_ij; scale, nu) * w_i * w_j
+    A small diagonal jitter (1e-8) is always added for numerical stability, whether or not weights are given.
+
+    Parameters
+    ----------
+    scale
+        Typical correlation length of the Matérn kernel.
+    nu
+        Smoothness parameter of the Matérn kernel.
+    pixel_points
+        Array (not a plain list) of shape [N, 2] with (y, x) coordinates (or any 2D coords; only distances matter).
+    weights
+        Optional array-like of shape [N]. If None, treated as all ones.
+    xp
+        Backend (numpy or jax.numpy).
+
+    Returns
+    -------
+    covariance_matrix
+        Array of shape [N, N].
+    """
+
+    # --------------------------------
+    # Pairwise distances (broadcasted)
+    # --------------------------------
+    diff = pixel_points[:, None, :] - pixel_points[None, :, :]  # (N, N, 2)
+    d_ij = xp.sqrt(diff[..., 0] ** 2 + diff[..., 1] ** 2)       # (N, N)
+
+    # --------------------------------
+    # Base Matérn covariance
+    # --------------------------------
+    covariance_matrix = matern_kernel(d_ij, l=scale, v=nu, xp=xp)  # (N, N)
+
+    # --------------------------------
+    # Apply weights: C_ij *= w_i * w_j
+    # (broadcasted outer product, JAX-safe)
+    # --------------------------------
+    if weights is not None:
+        w = xp.asarray(weights)
+        # Assumes w has shape (N,): outer product (N,1)*(1,N) -> (N,N)
+        covariance_matrix = covariance_matrix * (w[:, None] * w[None, :])
+
+    # --------------------------------
+    # Add diagonal jitter (JAX-safe)
+    # --------------------------------
+    pixels = pixel_points.shape[0]
+    covariance_matrix = covariance_matrix + 1e-8 * xp.eye(pixels)
+
+    return covariance_matrix
+
+
+class MaternAdaptiveBrightnessKernel(MaternKernel):
     def __init__(
-            self,
-            coefficient: float = 1.0,
-            scale: float = 1.0,
-            nu: float = 0.5,
-            rho: float = 1.0,
+        self,
+        coefficient: float = 1.0,
+        scale: float = 1.0,
+        nu: float = 0.5,
+        rho: float = 1.0,
     ):
-        super().__init__(coefficient=coefficient, scale=scale, rho=rho)
-        self.nu = nu
+        """
+        Regularization which uses a Matern smoothing kernel to regularize the solution with regularization weights
+        that adapt to the brightness of the source being reconstructed.
+
+        For this regularization scheme, every pixel is regularized with every other pixel. This contrasts with many
+        other schemes, which regularize neighboring pixels (e.g. do the pixels share a Delaunay edge?) or compute
+        derivatives around the center of the pixel (where nearby pixels are regularized locally in similar ways).
+
+        This makes the regularization matrix fully dense and may therefore change the run times of the solution.
+        It also leads to more overall smoothing which can lead to more stable linear inversions.
+
+        For the weighted regularization scheme, each pixel is given an 'effective regularization weight', which is
+        applied when each set of pixel neighbors is regularized with one another. The motivation for this is that
+        different regions of a pixelization's mesh require different levels of regularization (e.g., high smoothing
+        where no signal is present and less smoothing where it is; see Nightingale, Dye and Massey 2018).
+
+        This scheme is not used by Vernardos et al. (2022): https://arxiv.org/abs/2202.09378, but it follows
+        a similar approach.
 
-    def covariance_kernel_weights_from(self, linear_obj: LinearObj) -> np.ndarray:
-        pixel_signals = linear_obj.pixel_signals_from(signal_scale=1.0)
-        return np.exp(-self.rho * (1 - pixel_signals / pixel_signals.max()))
+        A full description of regularization and this matrix can be found in the parent `AbstractRegularization` class.
 
-    def regularization_matrix_from(self, linear_obj: LinearObj) -> np.ndarray:
-        kernel_weights = self.covariance_kernel_weights_from(linear_obj=linear_obj)
+        Parameters
+        ----------
+        coefficient
+            The regularization coefficient which controls the degree of smoothing of the inversion reconstruction.
+        scale
+            The typical correlation length of the Matérn regularization pattern.
+        nu
+            Controls the smoothness of the regularization pattern (`nu=0.5` gives the exponential kernel; large `nu` approaches a Gaussian).
+        """
+        super().__init__(coefficient=coefficient, scale=scale, nu=nu)
+        self.rho = rho
+
+    def covariance_kernel_weights_from(self, linear_obj: LinearObj, xp=np) -> np.ndarray:
+        """
+        Returns per-pixel kernel weights that adapt to the reconstructed pixel brightness.
+        """
+        # Assumes linear_obj.pixel_signals_from is xp-aware elsewhere in the codebase.
+        pixel_signals = linear_obj.pixel_signals_from(signal_scale=1.0, xp=xp)
+
+        max_signal = xp.max(pixel_signals)
+        max_signal = xp.maximum(max_signal, 1e-8)  # avoid divide-by-zero (JAX-safe)
+
+        return xp.exp(-self.rho * (1.0 - pixel_signals / max_signal))
+
+    def regularization_matrix_from(self, linear_obj: LinearObj, xp=np) -> np.ndarray:
+        kernel_weights = self.covariance_kernel_weights_from(linear_obj=linear_obj, xp=xp)
+
+        # NOTE(review): the grid is passed as-is here; confirm whether `.array` is needed for non-NumPy backends.
+        pixel_points = linear_obj.source_plane_mesh_grid
 
         covariance_matrix = matern_cov_matrix_from(
             scale=self.scale,
-            pixel_points=linear_obj.source_plane_mesh_grid,
+            pixel_points=pixel_points,
             nu=self.nu,
             weights=kernel_weights,
+            xp=xp,
         )
 
-        return self.coefficient * np.linalg.inv(covariance_matrix)
+        return self.coefficient * xp.linalg.inv(covariance_matrix)
 
-    def regularization_weights_from(self, linear_obj: LinearObj) -> np.ndarray:
+    def regularization_weights_from(self, linear_obj: LinearObj, xp=np) -> np.ndarray:
         """
         Returns the regularization weights of this regularization scheme.
-
-        The regularization weights define the level of regularization applied to each parameter in the linear object
-        (e.g. the ``pixels`` in a ``Mapper``).
-
-        For standard regularization (e.g. ``Constant``) are weights are equal, however for adaptive schemes
-        (e.g. ``AdaptiveBrightness``) they vary to adapt to the data being reconstructed.
-
-        Parameters
-        ----------
-        linear_obj
-            The linear object (e.g. a ``Mapper``) which uses these weights when performing regularization.
-
-        Returns
-        -------
-        The regularization weights.
         """
-        return 1.0/self.covariance_kernel_weights_from(linear_obj=linear_obj) #meaningless, but consistent with other regularization schemes
+        return 1.0 / self.covariance_kernel_weights_from(linear_obj=linear_obj, xp=xp)
diff --git a/autoarray/structures/arrays/kernel_2d.py b/autoarray/structures/arrays/kernel_2d.py
@@ -612,7 +612,7 @@ def convolved_image_from(
         image,
         blurring_image,
         jax_method="direct",
-        use_mixed_precision : bool = False,
+        use_mixed_precision: bool = False,
         xp=np,
     ):
         """
diff --git a/test_autoarray/inversion/regularizations/test_matern_adaptive_brightness_kernel.py b/test_autoarray/inversion/regularizations/test_matern_adaptive_brightness_kernel.py
@@ -0,0 +1,55 @@
+import pytest
+
+import autoarray as aa
+import numpy as np
+
+np.set_printoptions(threshold=np.inf)
+
+
+def test__regularization_matrix():
+
+    reg = aa.reg.MaternAdaptiveBrightnessKernel(coefficient=1.0, scale=2.0, nu=2.0, rho=1.0)
+
+    neighbors = np.array(
+        [
+            [1, 4, -1, -1],
+            [2, 4, 0, -1],
+            [3, 4, 5, 1],
+            [5, 2, -1, -1],
+            [5, 0, 1, 2],
+            [2, 3, 4, -1],
+        ]
+    )
+
+    neighbors_sizes = np.array([2, 3, 4, 2, 4, 3])
+    pixel_signals = np.array([1.0, 2.0, 3.0, 4.0, 5.0, 6.0])
+
+    mesh_grid = aa.m.MockMeshGrid(neighbors=neighbors, neighbors_sizes=neighbors_sizes)
+
+    source_plane_mesh_grid = aa.Grid2D.no_mask(
+        values=[[0.1, 0.1], [1.1, 0.6], [2.1, 0.1], [0.4, 1.1], [1.1, 7.1], [2.1, 1.1]],
+        shape_native=(3, 2),
+        pixel_scales=1.0,
+    )
+
+    mapper = aa.m.MockMapper(
+        source_plane_mesh_grid=source_plane_mesh_grid, pixel_signals=pixel_signals
+    )
+
+    regularization_matrix = reg.regularization_matrix_from(linear_obj=mapper)
+
+    assert regularization_matrix[0, 0] == pytest.approx(18.7439565009, 1.0e-4)
+    assert regularization_matrix[0, 1] == pytest.approx(-8.786547368, 1.0e-4)
+
+    reg = aa.reg.MaternAdaptiveBrightnessKernel(coefficient=1.5, scale=2.5, nu=2.5, rho=1.5)
+
+    pixel_signals = np.array([1.0, 2.0, 3.0, 4.0, 5.0, 6.0])
+
+    mapper = aa.m.MockMapper(
+        source_plane_mesh_grid=source_plane_mesh_grid, pixel_signals=pixel_signals
+    )
+
+    regularization_matrix = reg.regularization_matrix_from(linear_obj=mapper)
+
+    assert regularization_matrix[0, 0] == pytest.approx(121.0190770, 1.0e-4)
+    assert regularization_matrix[0, 1] == pytest.approx(-66.9580331, 1.0e-4)