From bfa69da5e5ea12302068ad74f0b0eec8b71f0891 Mon Sep 17 00:00:00 2001
From: Josh Hope-Collins <joshua.hope-collins13@imperial.ac.uk>
Date: Mon, 10 Nov 2025 11:22:19 +0000
Subject: [PATCH] White noise generators and AR covariance operators

Co-authored-by: Jack Betteridge <j.betteridge@imperial.ac.uk>
---
 firedrake/adjoint/__init__.py                 |   2 +
 firedrake/adjoint/covariance_operator.py      | 445 ++++++++++++++++++
 .../adjoint/test_covariance_operator.py       | 187 ++++++++
 3 files changed, 634 insertions(+)
 create mode 100644 firedrake/adjoint/covariance_operator.py
 create mode 100644 tests/firedrake/adjoint/test_covariance_operator.py

diff --git a/firedrake/adjoint/__init__.py b/firedrake/adjoint/__init__.py
index d3d28e6129..d00ad97193 100644
--- a/firedrake/adjoint/__init__.py
+++ b/firedrake/adjoint/__init__.py
@@ -38,6 +38,8 @@
 from firedrake.adjoint.ufl_constraints import UFLInequalityConstraint, \
     UFLEqualityConstraint  # noqa F401
 from firedrake.adjoint.ensemble_reduced_functional import EnsembleReducedFunctional  # noqa F401
+from firedrake.adjoint.covariance_operator import (  # noqa F401
+    NoiseBackend, WhiteNoiseGenerator, GaussianCovarianceOperator, DiffusionFormulation)
 import numpy_adjoint  # noqa F401
 import firedrake.ufl_expr
 import types
diff --git a/firedrake/adjoint/covariance_operator.py b/firedrake/adjoint/covariance_operator.py
new file mode 100644
index 0000000000..dfd67b59cc
--- /dev/null
+++ b/firedrake/adjoint/covariance_operator.py
@@ -0,0 +1,445 @@
+from enum import Enum
+from functools import cached_property
+from textwrap import dedent
+from petsctools import get_petscvariables
+from loopy import generate_code_v2
+from pyop2 import op2
+from firedrake.tsfc_interface import compile_form
+from firedrake import (
+    grad, inner, avg, action, outer, replace,
+    assemble, CellSize, FacetNormal,
+    dx, ds, dS, sqrt, pi, Constant,
+    Function, Cofunction, RieszMap,
+    TrialFunction, TestFunction,
+    FunctionSpace, VectorFunctionSpace,
+    BrokenElement, VectorElement,
+    RandomGenerator, PCG64,
+    LinearVariationalProblem,
+    LinearVariationalSolver,
+    LinearSolver,
+)
+
+
+class DiffusionFormulation(Enum):  # selects which weak form diffusion_form() builds
+    CG = 'CG'  # cell integrals only: mass term plus kappa-weighted gradient term
+    DG = 'DG'  # cell integrals plus interior (dS) and exterior (ds) facet terms
+
+
+def diffusion_form(u, v, kappa, formulation=DiffusionFormulation.CG):  # return the bilinear form a(u, v) for the chosen formulation
+    if formulation == DiffusionFormulation.CG:  # mass term plus kappa-weighted gradient term
+        return inner(u, v)*dx + inner(kappa*grad(u), grad(v))*dx
+
+    elif formulation == DiffusionFormulation.DG:  # same cell terms plus facet terms on dS and ds
+        mesh = v.function_space().mesh()
+        n = FacetNormal(mesh)
+        h = CellSize(mesh)
+        h_avg = 0.5*(h('+') + h('-'))
+        alpha_h = Constant(4.0)/h_avg  # penalty weight on interior facets (dS)
+        gamma_h = Constant(8.0)/h  # penalty weight on exterior facets (ds)
+        return (
+            inner(u, v)*dx + kappa*(
+                inner(grad(u), grad(v))*dx
+                - inner(avg(2*outer(u, n)), avg(grad(v)))*dS
+                - inner(avg(grad(u)), avg(2*outer(v, n)))*dS
+                + alpha_h*inner(avg(2*outer(u, n)), avg(2*outer(v, n)))*dS
+                - inner(outer(u, n), grad(v))*ds
+                - inner(grad(u), outer(v, n))*ds
+                + gamma_h*inner(u, v)*ds
+            )
+        )
+
+    else:
+        raise ValueError(f"Unknown DiffusionFormulation {formulation}")  # f-string so the offending value is shown
+
+
+class CholeskyFactorisation:  # wraps a Cholesky PC for `form` (default: the mass form on V)
+    def __init__(self, V, form=None):
+        self._V = V
+
+        if form is None:  # default to the mass form on V
+            self.form = inner(TrialFunction(V),
+                              TestFunction(V))*dx
+        else:
+            self.form = form
+
+        self._wrk = Function(V)  # work function reused as the operand of action(form, .)
+
+    @property
+    def function_space(self):
+        return self._V
+
+    @cached_property
+    def _assemble_action(self):  # assembler for action(form, _wrk), built once on first use
+        from firedrake.assemble import get_assembler
+        return get_assembler(action(self.form, self._wrk)).assemble
+
+    def assemble_action(self, u, tensor=None):  # assemble action(form, u), optionally into `tensor`
+        self._wrk.assign(u)
+        return self._assemble_action(tensor=tensor)
+
+    @cached_property
+    def solver(self):  # preonly KSP with a Cholesky PC on the assembled aij matrix
+        return LinearSolver(
+            assemble(self.form, mat_type='aij'),
+            solver_parameters={
+                "ksp_type": "preonly",
+                "pc_type": "cholesky",
+                "pc_factor_mat_ordering_type": "nd"})
+
+    @cached_property
+    def pc(self):
+        return self.solver.ksp.getPC()
+
+    def apply(self, u):  # assemble action(form, u), then PC.applySymmetricLeft into a new cofunction
+        u = self.assemble_action(u)
+        v = Cofunction(self.function_space.dual())  # function_space is the only space accessor this class defines
+        with u.dat.vec_ro as u_v, v.dat.vec_wo as v_v:
+            self.pc.applySymmetricLeft(u_v, v_v)
+        return v
+
+    def apply_transpose(self, u):  # PC.applySymmetricRight on u, then assemble action(form, .) of the result
+        v = Function(self.function_space)
+        with u.dat.vec_ro as u_v, v.dat.vec_wo as v_v:
+            self.pc.applySymmetricRight(u_v, v_v)
+        v = self.assemble_action(v)
+        return v
+
+
+class NoiseBackend(Enum):  # selects the implementation used by WhiteNoiseGenerator
+    PYOP2 = 'pyop2'  # PyOP2NoiseBackend: per-cell kernel run through op2.par_loop
+    PETSC = 'petsc'  # PetscNoiseBackend: Cholesky factorisation applied through a PETSc PC
+
+
+class NoiseBackendBase:  # shared state and helpers for the white-noise backends; subclasses implement sample()
+    def __init__(self, V, rng=None):
+        self._V = V
+        self._rng = rng or RandomGenerator(PCG64())  # default generator when none is supplied
+
+    def sample(self, *, rng=None, tensor=None):  # abstract here; overridden by each backend
+        raise NotImplementedError
+
+    @cached_property
+    def broken_space(self):  # space on the same mesh built from the BrokenElement of V's element
+        element = self.function_space.ufl_element()
+        mesh = self.function_space.mesh().unique()
+        if isinstance(element, VectorElement):  # break the first sub-element, then rebuild the vector space
+            dim = element.num_sub_elements
+            scalar_element = element.sub_elements[0]
+            broken_element = BrokenElement(scalar_element)
+            Vbroken = VectorFunctionSpace(
+                mesh, broken_element, dim=dim)
+        else:
+            Vbroken = FunctionSpace(
+                mesh, BrokenElement(element))
+        return Vbroken
+
+    @property
+    def function_space(self):
+        return self._V
+
+    @property
+    def rng(self):
+        return self._rng
+
+    @cached_property
+    def riesz_map(self):  # cached RieszMap on V; backends use it when sample(apply_riesz=True)
+        return RieszMap(self.function_space, constant_jacobian=True)
+
+
+class PetscNoiseBackend(NoiseBackendBase):  # white noise via CholeskyFactorisation on the broken space
+    def __init__(self, V, rng=None):
+        super().__init__(V, rng=rng)
+        self.cholesky = CholeskyFactorisation(self.broken_space)  # no form given, so the mass form is used
+
+    def sample(self, *, rng=None, tensor=None, apply_riesz=False):
+        V = self.function_space
+        rng = rng or self.rng
+
+        # z: standard normal coefficients on the broken space
+        z = rng.standard_normal(self.broken_space)
+        # C z: result of CholeskyFactorisation.apply_transpose on z
+        Cz = self.cholesky.apply_transpose(z)
+        # L C z: interpolate the broken-space result into the dual of V
+        b = Cofunction(V.dual()).interpolate(Cz)
+
+        if apply_riesz:  # hand back the Riesz representation instead of the cofunction
+            b = b.riesz_representation(self.riesz_map)
+
+        if tensor:  # write into the caller's tensor when one was given
+            tensor.assign(b)
+        else:
+            tensor = b
+
+        return tensor
+
+
+class PyOP2NoiseBackend(NoiseBackendBase):  # white noise via a per-cell C kernel run with op2.par_loop
+    def __init__(self, V, rng=None):
+        super().__init__(V, rng=rng)
+
+        u = TrialFunction(V)
+        v = TestFunction(V)
+        mass = inner(u, v)*dx
+
+        # Compile the mass form, generate C source for its cell kernel and mark that kernel static
+        mass_ker, *stuff = compile_form(mass, "mass")
+        mass_code = generate_code_v2(mass_ker.kinfo.kernel.code).device_code()
+        mass_code = mass_code.replace(
+            "void " + mass_ker.kinfo.kernel.name,
+            "static void " + mass_ker.kinfo.kernel.name)
+
+        # Wrap the mass kernel in a C function that Cholesky-factorises the
+        # element matrix it produces and applies the factor to the broken vector z
+        name = mass_ker.kinfo.kernel.name
+        blocksize = mass_ker.kinfo.kernel.code[name].args[0].shape[0]  # leading extent of the kernel's first argument
+
+        cholesky_code = dedent(  # C source: dpotrf_/dgemv_ prototypes, the mass kernel, then apply_cholesky
+            f"""\
+            extern void dpotrf_(char *UPLO,
+                                int *N,
+                                double *A,
+                                int *LDA,
+                                int *INFO);
+
+            extern void dgemv_(char *TRANS,
+                               int *M,
+                               int *N,
+                               double *ALPHA,
+                               double *A,
+                               int *LDA,
+                               double *X,
+                               int *INCX,
+                               double *BETA,
+                               double *Y,
+                               int *INCY);
+
+            {mass_code}
+
+            void apply_cholesky(double *__restrict__ z,
+                                double *__restrict__ b,
+                                double const *__restrict__ coords)
+            {{
+                char uplo[1];
+                int32_t N = {blocksize}, LDA = {blocksize}, INFO = 0;
+                int32_t i=0, j=0;
+                uplo[0] = 'u';
+                double H[{blocksize}*{blocksize}] = {{{{ 0.0 }}}};
+
+                char trans[1];
+                int32_t stride = 1;
+                double scale = 1.0;
+                double zero = 0.0;
+
+                {mass_ker.kinfo.kernel.name}(H, coords);
+
+                uplo[0] = 'u';
+                dpotrf_(uplo, &N, H, &LDA, &INFO);
+                for (int i = 0; i < N; i++)
+                    for (int j = 0; j < N; j++)
+                        if (j>i)
+                            H[i*N + j] = 0.0;
+
+                trans[0] = 'T';
+                dgemv_(trans, &N, &N, &scale, H, &LDA, z, &stride, &zero, b, &stride);
+            }}
+            """
+        )
+
+        # Rank 0 reads the BLAS/LAPACK link and include flags from the PETSc variables and broadcasts them
+        # TODO: Ask CW if this is the right comm to use.
+        comm = V.mesh()._comm
+        if comm.rank == 0:
+            petsc_variables = get_petscvariables()
+            BLASLAPACK_LIB = petsc_variables.get("BLASLAPACK_LIB", "")
+            BLASLAPACK_LIB = comm.bcast(BLASLAPACK_LIB, root=0)
+            BLASLAPACK_INCLUDE = petsc_variables.get("BLASLAPACK_INCLUDE", "")
+            BLASLAPACK_INCLUDE = comm.bcast(BLASLAPACK_INCLUDE, root=0)
+        else:  # receive in the same order as rank 0 sends: LIB first, then INCLUDE
+            BLASLAPACK_LIB = comm.bcast(None, root=0)
+            BLASLAPACK_INCLUDE = comm.bcast(None, root=0)
+
+        self.cholesky_kernel = op2.Kernel(
+            cholesky_code, "apply_cholesky",
+            include_dirs=BLASLAPACK_INCLUDE.split(),
+            ldargs=BLASLAPACK_LIB.split())
+
+    def sample(self, *, rng=None, tensor=None, apply_riesz=False):
+        rng = rng or self.rng
+
+        z = rng.standard_normal(self.broken_space)  # standard normal coefficients on the broken space
+        b = Cofunction(self.function_space.dual())  # output cofunction that the kernel increments into
+
+        z_arg = z.dat(op2.READ, self.broken_space.cell_node_map())
+        b_arg = b.dat(op2.INC, self.function_space.cell_node_map())
+
+        mesh = self.function_space.mesh()
+        coords = mesh.coordinates
+        c_arg = coords.dat(op2.READ, coords.cell_node_map())
+
+        op2.par_loop(  # argument order matches apply_cholesky(z, b, coords)
+            self.cholesky_kernel,
+            mesh.cell_set,
+            z_arg, b_arg, c_arg
+        )
+
+        if apply_riesz:  # hand back the Riesz representation instead of the cofunction
+            b = b.riesz_representation(self.riesz_map)
+
+        if tensor:  # write into the caller's tensor when one was given
+            tensor.assign(b)
+        else:
+            tensor = b
+
+        return tensor
+
+
+class WhiteNoiseGenerator:
+    r"""Generate white noise samples on a function space.
+
+    :arg V: The :class:`firedrake.FunctionSpace` to construct
+        white noise samples on.
+    :arg backend: The :class:`NoiseBackend` member specifying how to calculate
+        and apply the mass matrix square root. Defaults to PYOP2.
+    :arg rng: Initialised random number generator to use for obtaining
+        random numbers. Defaults to ``RandomGenerator(PCG64())``.
+
+    :meth:`sample` returns a :class:`firedrake.Cofunction` in ``V.dual()``
+    with b ~ Normal(0, M), where b is the dat.data of the cofunction and
+    M is the mass matrix. With ``apply_riesz=True`` the Riesz representation
+    of that cofunction is returned instead.
+
+    For details see [Croci et al 2018]:
+    https://epubs.siam.org/doi/10.1137/18M1175239
+    """
+
+    # TODO: Add Croci to citations manager
+
+    def __init__(self, V, backend=NoiseBackend.PYOP2, rng=None):
+        if backend == NoiseBackend.PYOP2:
+            self.backend = PyOP2NoiseBackend(V, rng=rng)
+        elif backend == NoiseBackend.PETSC:
+            self.backend = PetscNoiseBackend(V, rng=rng)
+        else:  # anything that is not a NoiseBackend member ends up here
+            raise ValueError(
+                f"Unrecognised white noise generation backend {backend}")
+
+        self.function_space = self.backend.function_space
+        self.rng = self.backend.rng  # the backend's generator (the default one if rng was None)
+
+    def sample(self, *, rng=None, tensor=None, apply_riesz=False):  # forwards everything to the backend
+        return self.backend.sample(
+            rng=rng, tensor=tensor, apply_riesz=apply_riesz)
+
+
+class GaussianCovarianceOperator:  # covariance operator applied through repeated solves of a diffusion form
+    def __init__(self, V, L, sigma=1, m=2, rng=None,
+                 bcs=None, form=DiffusionFormulation.CG,
+                 solver_parameters=None, options_prefix=None):
+        """Validate sigma, L and m (ValueError otherwise) and, for m > 0, build the diffusion and mass solvers."""
+        self.rng = rng or WhiteNoiseGenerator(V)  # a WhiteNoiseGenerator-like object, not a raw RandomGenerator
+        self.function_space = self.rng.function_space
+
+        if sigma <= 0:
+            raise ValueError("Standard deviation must be positive.")
+        if L < 0:  # NOTE(review): L == 0 passes this check but gives lamda == 0, and 1/lamda is used when m > 0
+            raise ValueError("Correlation lengthscale must be positive.")
+        if m < 0:
+            raise ValueError("Number of iterations must be non-negative.")
+        if (m % 2) != 0:
+            raise ValueError("Number of iterations must be even.")
+
+        self.stddev = sigma
+        self.lengthscale = L
+        self.iterations = m
+
+        if self.iterations > 0:  # with m == 0 no solver is built; the methods then only scale by powers of stddev
+            # Calculate diffusion operator parameters
+            self.kappa = Constant(L*L/(2*m))
+            lambda_g = Constant(sqrt(2*pi)*L)
+            self.lamda = Constant(sigma*sqrt(lambda_g))
+
+            # setup diffusion solver
+            u, v = TrialFunction(V), TestFunction(V)
+            if isinstance(form, DiffusionFormulation):
+                a = diffusion_form(u, v, self.kappa, formulation=form)
+            else:
+                a = form  # caller supplied the bilinear form directly
+            self._rhs = Function(V)
+            rhs = inner(self._rhs, v)*dx
+            self._u = Function(V)
+
+            self.solver = LinearVariationalSolver(
+                LinearVariationalProblem(a, rhs, self._u, bcs=bcs,
+                                         constant_jacobian=True),
+                solver_parameters=solver_parameters,
+                options_prefix=options_prefix)
+
+            # setup mass solver
+            M = inner(u, v)*dx
+            rhs = replace(a, {u: self._rhs})  # the diffusion form acting on _rhs becomes the right-hand side
+
+            self.mass_solver = LinearVariationalSolver(
+                LinearVariationalProblem(M, rhs, self._u, bcs=bcs,
+                                         constant_jacobian=True),
+                solver_parameters=solver_parameters)
+
+    def sample(self, *, rng=None, tensor=None):  # lamda times m/2 diffusion solves of Riesz-represented white noise
+        tensor = tensor or Function(self.function_space)
+        rng = rng or self.rng
+        w = rng.sample(apply_riesz=True)
+
+        if self.iterations == 0:
+            return tensor.assign(self.stddev*w)  # lamda is only defined for m > 0; scale by stddev here
+
+        self._u.assign(w)
+        for _ in range(self.iterations//2):
+            self._rhs.assign(self._u)
+            self.solver.solve()
+
+        return tensor.assign(self.lamda*self._u)
+
+    def norm(self, x):
+        """Return assemble(inner(y, y)*dx), y being x/lamda after m/2 mass solves (x/stddev when m == 0)."""
+        if self.iterations == 0:
+            x_scaled = (1/self.stddev)*x  # divide, matching the 1/lamda scaling of the m > 0 branch
+            return assemble(inner(x_scaled, x_scaled)*dx)
+
+        lamda1 = 1/self.lamda
+
+        self._u.assign(lamda1*x)
+        for _ in range(self.iterations//2):
+            self._rhs.assign(self._u)
+            self.mass_solver.solve()
+
+        return assemble(inner(self._u, self._u)*dx)
+
+    def apply_inverse(self, x, *, tensor=None):  # 1/lamda times m mass solves applied to x/lamda
+        tensor = tensor or Function(self.function_space)
+
+        if self.iterations == 0:
+            variance1 = 1/(self.stddev*self.stddev)
+            return tensor.assign(variance1*x)
+
+        lamda1 = 1/self.lamda
+        self._u.assign(lamda1*x)
+
+        for _ in range(self.iterations):
+            self._rhs.assign(self._u)
+            self.mass_solver.solve()
+
+        return tensor.assign(lamda1*self._u)
+
+    def apply_action(self, x, *, tensor=None):  # lamda times m diffusion solves applied to lamda*x
+        tensor = tensor or Function(self.function_space)
+
+        if self.iterations == 0:
+            variance = self.stddev*self.stddev
+            return tensor.assign(variance*x)
+
+        self._u.assign(self.lamda*x)
+
+        for _ in range(self.iterations):
+            self._rhs.assign(self._u)
+            self.solver.solve()
+
+        return tensor.assign(self.lamda*self._u)
diff --git a/tests/firedrake/adjoint/test_covariance_operator.py b/tests/firedrake/adjoint/test_covariance_operator.py
new file mode 100644
index 0000000000..aa0ad075b0
--- /dev/null
+++ b/tests/firedrake/adjoint/test_covariance_operator.py
@@ -0,0 +1,187 @@
+import pytest
+import numpy as np
+from scipy.sparse import csr_matrix
+from firedrake import *
+from firedrake.adjoint import *
+
+
+def petsc2numpy_vec(petsc_vec):
+    """Allgather a PETSc.Vec."""
+    gvec = petsc_vec
+    gather, lvec = PETSc.Scatter().toAll(gvec)  # scatter object plus the local Vec it fills
+    gather(gvec, lvec, addv=PETSc.InsertMode.INSERT_VALUES)
+    return lvec.array_r.copy()  # return a copy of the gathered entries as a numpy array
+
+
+def petsc2numpy_mat(petsc_mat):
+    """Allgather a PETSc.Mat."""
+    comm = petsc_mat.getComm()
+    local_mat = petsc_mat.getRedundantMatrix(  # redundant copy of the matrix on COMM_SELF
+        comm.size, PETSc.COMM_SELF)
+    return csr_matrix(
+        local_mat.getValuesCSR()[::-1],  # reversed so the tuple is in the order csr_matrix expects
+        shape=local_mat.getSize()
+    ).todense()
+
+
+@pytest.mark.parallel([1, 2])
+@pytest.mark.parametrize("degree", (1, 2), ids=["degree1", "degree2"])
+@pytest.mark.parametrize("dim", (0, 1, 2), ids=["scalar", "vec1", "vec2"])
+@pytest.mark.parametrize("family", ("CG", "DG"))
+@pytest.mark.parametrize("mesh_type", ("interval", "square"))
+@pytest.mark.parametrize("backend", ("pyop2", "petsc"))
+def test_white_noise(family, degree, mesh_type, dim, backend):
+    """Test that white noise generator converges to a mass matrix covariance.
+    """
+    if backend == "petsc" and COMM_WORLD.size > 1:
+        pytest.skip(
+            "petsc backend for noise generation not implemented in parallel.")
+
+    nx = 10
+    # Build the mesh for the requested topological dimension
+    if mesh_type == 'interval':
+        mesh = UnitIntervalMesh(nx)
+    elif mesh_type == 'square':
+        mesh = UnitSquareMesh(nx, nx)
+    elif mesh_type == 'cube':  # not selected by the current mesh_type parametrisation
+        mesh = UnitCubeMesh(nx, nx, nx)
+
+    # dim == 0 selects a scalar space, dim > 0 a vector space with that many components
+    if dim > 0:
+        V = VectorFunctionSpace(mesh, family, degree, dim=dim)
+    else:
+        V = FunctionSpace(mesh, family, degree)
+
+    # Finite element white noise has mass matrix covariance
+    M = inner(TrialFunction(V), TestFunction(V))*dx
+    covmat = petsc2numpy_mat(
+        assemble(M, mat_type='aij').petscmat)
+
+    rng = RandomGenerator(PCG64(seed=13))  # fixed seed
+
+    generator = WhiteNoiseGenerator(
+        V, backend=NoiseBackend(backend), rng=rng)
+
+    # Test convergence as sample size increases
+    nsamples = [50, 100, 200, 400, 800]
+
+    samples = np.empty((V.dim(), nsamples[-1]))  # one column per sample
+    for i in range(nsamples[-1]):
+        with generator.sample().dat.vec_ro as bv:
+            samples[:, i] = petsc2numpy_vec(bv)
+
+    covariances = [np.cov(samples[:, :ns]) for ns in nsamples]  # sample covariance from the first ns columns
+
+    # Scale each error by sqrt(n) and normalise by the last entry before comparing
+    errors = [np.linalg.norm(cov-covmat) for cov in covariances]
+    normalised_errors = [err*sqrt(n) for err, n in zip(errors, nsamples)]
+    normalised_errors /= normalised_errors[-1]  # NOTE(review): `/=` on a list; presumably works via NumPy's reflected division — confirm
+
+    # Loose tolerance because RNG
+    tol = 0.2
+    assert (1 - tol) < np.max(normalised_errors) < (1 + tol)
+
+
+@pytest.mark.parallel([1, 2])
+@pytest.mark.parametrize("m", (0, 2, 4))
+@pytest.mark.parametrize("degree", (1, 2), ids=["degree1", "degree2"])
+@pytest.mark.parametrize("dim", (0, 1, 2), ids=["scalar", "vector1", "vector2"])
+@pytest.mark.parametrize("family", ("CG", "DG"))
+@pytest.mark.parametrize("mesh_type", ("interval", "square"))
+@pytest.mark.parametrize("backend", ("pyop2", "petsc"))
+def test_covariance_inverse_action(m, family, degree, mesh_type, dim, backend):
+    """Test that apply_inverse undoes apply_action of the covariance operator.
+    """
+    if backend == "petsc" and COMM_WORLD.size > 1:
+        pytest.skip(
+            "petsc backend for noise generation not implemented in parallel.")
+
+    nx = 16
+    if mesh_type == 'interval':
+        mesh = UnitIntervalMesh(nx)
+        x, = SpatialCoordinate(mesh)
+        wexpr = cos(2*pi*x)
+    elif mesh_type == 'square':
+        mesh = UnitSquareMesh(nx, nx)
+        x, y = SpatialCoordinate(mesh)
+        wexpr = cos(2*pi*x)*cos(4*pi*x)  # NOTE(review): y is unused; cos(4*pi*y) may have been intended — confirm
+    elif mesh_type == 'cube':  # not selected by the current mesh_type parametrisation
+        mesh = UnitCubeMesh(nx, nx, nx)
+        x, y, z = SpatialCoordinate(mesh)
+        wexpr = cos(2*pi*x)*cos(4*pi*y)*cos(pi*z)
+    if dim > 0:
+        V = VectorFunctionSpace(mesh, family, degree, dim=dim)
+        wexpr = as_vector([(-1)**(j+1)*wexpr for j in range(dim)])  # parenthesised so the sign alternates per component
+    else:
+        V = FunctionSpace(mesh, family, degree)
+
+    rng = WhiteNoiseGenerator(
+        V, backend=NoiseBackend(backend),
+        rng=RandomGenerator(PCG64(seed=13)))
+
+    L = 0.1
+    sigma = 0.9
+
+    solver_parameters = {
+        'ksp_type': 'preonly',
+        'pc_type': 'lu',
+        'pc_factor_mat_solver_type': 'mumps'
+    }
+
+    B = GaussianCovarianceOperator(
+        V, L, sigma, m, rng=rng,
+        solver_parameters=solver_parameters, options_prefix="",
+        form=DiffusionFormulation(family))
+
+    w = Function(V).project(wexpr)
+    wcheck = B.apply_inverse(B.apply_action(w))  # round trip should reproduce w
+
+    tol = 1e-8
+    # Particularly sensitive tests??
+    if mesh_type == 'square' and family == 'DG' and degree == 2 and m == 4:
+        tol = 5e-4
+
+    assert errornorm(w, wcheck) < tol
+
+
+@pytest.mark.parallel([1, 2])
+@pytest.mark.parametrize("m", (0, 2, 4))
+@pytest.mark.parametrize("family", ("CG", "DG"))
+@pytest.mark.parametrize("backend", ("pyop2", "petsc"))
+def test_covariance_adjoint_norm(m, family, backend):
+    """Taylor-test the derivatives of a ReducedFunctional built on B.norm.
+    """
+    if backend == "petsc" and COMM_WORLD.size > 1:
+        pytest.skip(
+            "petsc backend for noise generation not implemented in parallel.")
+    nx = 20
+    L = 0.2
+    sigma = 0.1
+
+    mesh = UnitIntervalMesh(nx)
+    x, = SpatialCoordinate(mesh)
+
+    V = FunctionSpace(mesh, family, 1)
+
+    u = Function(V).project(sin(2*pi*x))
+    v = Function(V).project(2 - 0.5*sin(6*pi*x))
+
+    B = GaussianCovarianceOperator(  # NOTE(review): `backend` is not passed on, so B builds its default generator
+        V, L, sigma, m,
+        form=DiffusionFormulation(family))
+
+    continue_annotation()
+    with set_working_tape() as tape:
+        w = Function(V).project(u**4 + v)
+        J = B.norm(w)
+        Jhat = ReducedFunctional(J, Control(u), tape=tape)
+    pause_annotation()
+
+    m = Function(V).project(sin(2*pi*(x+0.2)))  # rebinds the parametrised `m`, which is no longer needed here
+    h = Function(V).project(sin(4*pi*(x-0.2)))
+
+    taylor = taylor_to_dict(Jhat, m, h)
+
+    assert min(taylor['R0']['Rate']) > 0.95, taylor['R0']
+    assert min(taylor['R1']['Rate']) > 1.95, taylor['R1']
+    assert min(taylor['R2']['Rate']) > 2.95, taylor['R2']