cagpjax.models.cagp

Computation-aware Gaussian Process models.

Classes:

ComputationAwareGP

ComputationAwareGP(posterior: ConjugatePosterior, policy: AbstractBatchLinearSolverPolicy, solver: AbstractLinearSolver[_LinearSolverState] = Cholesky(1e-06))

Bases: Module, Generic[_LinearSolverState]

Computation-aware Gaussian Process model.

This model implements scalable GP inference by using batch linear solver policies to project the kernel and data to a lower-dimensional subspace, while accounting for the extra uncertainty imposed by observing only this subspace.

Attributes:

  • posterior

    (ConjugatePosterior) –

    GPJax conjugate posterior.

  • policy

    (AbstractBatchLinearSolverPolicy) –

    Batch linear solver policy defining the projection subspace.

  • solver

    (AbstractLinearSolver[_LinearSolverState]) –

    Linear solver for positive semi-definite systems.

Notes
  • Only single-output models are currently supported.

Initialize the Computation-Aware GP model.

Parameters:

  • posterior

    (ConjugatePosterior) –

    GPJax conjugate posterior.

  • policy

    (AbstractBatchLinearSolverPolicy) –

    The batch linear solver policy that defines the subspace into which the data is projected.

  • solver

    (AbstractLinearSolver[_LinearSolverState], default: Cholesky(1e-06) ) –

    The linear solver method to use for solving linear systems with positive semi-definite operators.

Methods:

  • elbo

    Compute the evidence lower bound.

  • init

    Compute the state of the conditioned GP posterior.

  • predict

    Compute the predictive distribution of the GP at the test inputs.

  • prior_kl

Compute the KL divergence between the CaGP posterior and the GP prior.

  • variational_expectation

    Compute the variational expectation.

Source code in src/cagpjax/models/cagp.py
def __init__(
    self,
    posterior: ConjugatePosterior,
    policy: AbstractBatchLinearSolverPolicy,
    solver: AbstractLinearSolver[_LinearSolverState] = Cholesky(1e-6),
):
    """Initialize the Computation-Aware GP model.

    Args:
        posterior: GPJax conjugate posterior.
        policy: The batch linear solver policy that defines the subspace into
            which the data is projected.
        solver: The linear solver method to use for solving linear systems with
            positive semi-definite operators.
    """
    self.posterior = posterior
    self.policy = policy
    self.solver = solver

elbo

elbo(state: ComputationAwareGPState[_LinearSolverState]) -> ScalarFloat

Compute the evidence lower bound.

Computes the evidence lower bound (ELBO) under this model's variational distribution.

Note

This should be used instead of gpjax.objectives.elbo.

Parameters:

  • state

    (ComputationAwareGPState[_LinearSolverState]) –

    State of the conditioned GP computed by init

Returns:

  • ScalarFloat

    ELBO value (scalar).

Source code in src/cagpjax/models/cagp.py
def elbo(self, state: ComputationAwareGPState[_LinearSolverState]) -> ScalarFloat:
    """Compute the evidence lower bound.

    Computes the evidence lower bound (ELBO) under this model's variational distribution.

    Note:
        This should be used instead of ``gpjax.objectives.elbo``

    Args:
        state: State of the conditioned GP computed by [`init`][..init]

    Returns:
        ELBO value (scalar).
    """
    var_exp = self.variational_expectation(state)
    kl = self.prior_kl(state)
    return jnp.sum(var_exp) - kl
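
The returned quantity is the standard variational bound; in the notation of this class's methods it corresponds term-by-term to `jnp.sum(var_exp) - kl` above (a general statement of the ELBO, not code from this package):

```latex
\mathrm{ELBO} = \sum_{i=1}^{N} \mathbb{E}_{q(f_i)}\!\left[\log p(y_i \mid f_i)\right] - \mathrm{KL}\left[q(f) \,\|\, p(f)\right]
```

Here the first term is `variational_expectation` summed over the training points and the second is `prior_kl`.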

init

init(train_data: Dataset) -> ComputationAwareGPState[_LinearSolverState]

Compute the state of the conditioned GP posterior.

Parameters:

  • train_data

    (Dataset) –

    The training data used to fit the GP.

Returns:

  • state ( ComputationAwareGPState[_LinearSolverState] ) –

    State of the conditioned CaGP posterior, which stores any necessary intermediate values for prediction and computing objectives.

Source code in src/cagpjax/models/cagp.py
def init(self, train_data: Dataset) -> ComputationAwareGPState[_LinearSolverState]:
    """Compute the state of the conditioned GP posterior.

    Args:
        train_data: The training data used to fit the GP.

    Returns:
        state: State of the conditioned CaGP posterior, which stores any necessary
            intermediate values for prediction and computing objectives.
    """
    # Ensure we have supervised training data
    if train_data.X is None or train_data.y is None:
        raise ValueError("Training data must be supervised.")

    # Unpack training data
    x = jnp.atleast_2d(train_data.X)
    y = jnp.atleast_1d(train_data.y).squeeze()

    # Unpack prior and likelihood
    prior = self.posterior.prior
    likelihood = self.posterior.likelihood

    # Mean and covariance of prior-predictive distribution
    mean_prior = prior.mean_function(x).squeeze()
    # Work around GPJax promoting dtype of mean to float64 (See JaxGaussianProcesses/GPJax#523)
    if isinstance(prior.mean_function, Constant):
        constant = prior.mean_function.constant[...]
        mean_prior = mean_prior.astype(constant.dtype)
    cov_xx = lazify(prior.kernel.gram(x))
    obs_cov = diag_like(cov_xx, likelihood.obs_stddev[...] ** 2)
    cov_prior = cov_xx + obs_cov

    # Project quantities to subspace
    actions = self.policy.to_actions(cov_prior)
    obs_cov_proj = congruence_transform(actions, obs_cov)
    cov_prior_proj = congruence_transform(actions, cov_prior)
    cov_prior_proj_state = self.solver.init(cov_prior_proj)

    residual_proj = actions.T @ (y - mean_prior)
    repr_weights_proj = self.solver.solve(cov_prior_proj_state, residual_proj)

    return ComputationAwareGPState(
        train_data=train_data,
        actions=actions,
        obs_cov_proj=obs_cov_proj,
        cov_prior_proj_state=cov_prior_proj_state,
        residual_proj=residual_proj,
        repr_weights_proj=repr_weights_proj,
    )
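
The projection at the heart of `init` is a congruence transform: with an actions operator S of shape (N, M), the N × N prior covariance collapses to the M × M matrix SᵀAS. A minimal NumPy sketch of this arithmetic, using hypothetical stand-ins for the Gram matrix, actions, and solver (not this package's API):

```python
import numpy as np

rng = np.random.default_rng(0)

# Toy stand-ins (hypothetical): N training points, M << N actions.
N, M = 50, 5
A = rng.standard_normal((N, N))
cov_xx = A @ A.T + N * np.eye(N)       # SPD stand-in for the prior Gram matrix
sigma2 = 0.1                           # observation noise variance
cov_prior = cov_xx + sigma2 * np.eye(N)

S = rng.standard_normal((N, M))        # actions: columns span the subspace
y = rng.standard_normal(N)
mean_prior = np.zeros(N)

# Congruence transform: project the N x N system down to M x M.
cov_prior_proj = S.T @ cov_prior @ S            # (M, M)
residual_proj = S.T @ (y - mean_prior)          # (M,)

# Projected representer weights via a Cholesky solve (the role of `solver`).
L = np.linalg.cholesky(cov_prior_proj)
repr_weights_proj = np.linalg.solve(L.T, np.linalg.solve(L, residual_proj))
```

All downstream work (prediction, KL, ELBO) then happens with M × M quantities rather than N × N ones.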

predict

predict(state: ComputationAwareGPState[_LinearSolverState], test_inputs: Float[Array, 'N D'] | None = None) -> GaussianDistribution

Compute the predictive distribution of the GP at the test inputs.

Parameters:

  • state

    (ComputationAwareGPState[_LinearSolverState]) –

    State of the conditioned GP computed by init

  • test_inputs

    (Float[Array, 'N D'] | None, default: None ) –

    The test inputs at which to make predictions. If not provided, predictions are made at the training inputs.

Returns:

  • GaussianDistribution ( GaussianDistribution ) –

    The predictive distribution of the GP at the test inputs.

Source code in src/cagpjax/models/cagp.py
def predict(
    self,
    state: ComputationAwareGPState[_LinearSolverState],
    test_inputs: Float[Array, "N D"] | None = None,
) -> GaussianDistribution:
    """Compute the predictive distribution of the GP at the test inputs.

    Args:
        state: State of the conditioned GP computed by [`init`][..init]
        test_inputs: The test inputs at which to make predictions. If not provided,
            predictions are made at the training inputs.

    Returns:
        GaussianDistribution: The predictive distribution of the GP at the
            test inputs.
    """
    train_data = state.train_data
    assert train_data.X is not None  # help out pyright
    x = train_data.X

    # Predictions at test points
    z = test_inputs if test_inputs is not None else x
    prior = self.posterior.prior
    mean_z = prior.mean_function(z).squeeze()
    # Work around GPJax promoting dtype of mean to float64 (See JaxGaussianProcesses/GPJax#523)
    if isinstance(prior.mean_function, Constant):
        constant = prior.mean_function.constant[...]
        mean_z = mean_z.astype(constant.dtype)
    cov_zz = lazify(prior.kernel.gram(z))
    cov_zx = cov_zz if test_inputs is None else prior.kernel.cross_covariance(z, x)
    cov_zx_proj = cov_zx @ state.actions

    # Posterior predictive distribution
    mean_pred = jnp.atleast_1d(mean_z + cov_zx_proj @ state.repr_weights_proj)
    cov_pred = cov_zz - self.solver.inv_congruence_transform(
        state.cov_prior_proj_state, cov_zx_proj.T
    )
    cov_pred = cola.PSD(cov_pred)

    return GaussianDistribution(mean_pred, cov_pred, solver=self.solver)
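
The predictive equations above can be sketched in plain NumPy. With hypothetical stand-ins for the kernel matrices and actions (not this package's API), the posterior mean and covariance at test points follow the projected representer form used in `predict`:

```python
import numpy as np

rng = np.random.default_rng(1)
N, M, P = 40, 4, 7                     # train points, actions, test points

# Hypothetical SPD joint Gram matrix over [train, test] inputs.
A = rng.standard_normal((N + P, N + P))
K = A @ A.T + (N + P) * np.eye(N + P)
cov_xx, cov_zz = K[:N, :N], K[N:, N:]
cov_zx = K[N:, :N]
cov_prior = cov_xx + 0.1 * np.eye(N)   # add observation noise on training block

S = rng.standard_normal((N, M))        # actions
y = rng.standard_normal(N)             # observations (zero prior mean assumed)

cov_prior_proj = S.T @ cov_prior @ S
repr_weights_proj = np.linalg.solve(cov_prior_proj, S.T @ y)

# Projected cross-covariance, then predictive mean and covariance.
cov_zx_proj = cov_zx @ S               # (P, M)
mean_pred = cov_zx_proj @ repr_weights_proj
cov_pred = cov_zz - cov_zx_proj @ np.linalg.solve(cov_prior_proj, cov_zx_proj.T)
```

Because only an M × M system is solved, the subtracted term is smaller than in exact GP regression, leaving extra predictive variance that accounts for observing the data only through the subspace.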

prior_kl

prior_kl(state: ComputationAwareGPState[_LinearSolverState]) -> ScalarFloat

Compute the KL divergence between the CaGP posterior and the GP prior.

Calculates \(\mathrm{KL}[q(f) || p(f)]\), where \(q(f)\) is the CaGP posterior approximation and \(p(f)\) is the GP prior.

Parameters:

  • state

    (ComputationAwareGPState[_LinearSolverState]) –

    State of the conditioned GP computed by init

Returns:

  • ScalarFloat

    KL divergence value (scalar).

Source code in src/cagpjax/models/cagp.py
def prior_kl(
    self, state: ComputationAwareGPState[_LinearSolverState]
) -> ScalarFloat:
    r"""Compute KL divergence between CaGP posterior and GP prior.

    Calculates $\mathrm{KL}[q(f) || p(f)]$, where $q(f)$ is the CaGP
    posterior approximation and $p(f)$ is the GP prior.

    Args:
        state: State of the conditioned GP computed by [`init`][..init]

    Returns:
        KL divergence value (scalar).
    """
    obs_cov_proj_solver_state = self.solver.init(state.obs_cov_proj)

    kl = (
        _kl_divergence_from_solvers(
            self.solver,
            state.residual_proj,
            obs_cov_proj_solver_state,
            jnp.zeros_like(state.residual_proj),
            state.cov_prior_proj_state,
        )
        - 0.5
        * congruence_transform(
            state.repr_weights_proj.T, state.obs_cov_proj
        ).squeeze()
    )

    return kl
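
For reference, the generic closed-form KL divergence between two M-dimensional Gaussians, of which the projected computation above is a specialization (this is the general identity, not this package's exact reduction):

```latex
\mathrm{KL}\left[\mathcal{N}(\mu_1, \Sigma_1) \,\|\, \mathcal{N}(\mu_0, \Sigma_0)\right]
  = \frac{1}{2}\left[\operatorname{tr}\!\left(\Sigma_0^{-1}\Sigma_1\right)
  + (\mu_0 - \mu_1)^\top \Sigma_0^{-1} (\mu_0 - \mu_1)
  - M + \log\frac{\det\Sigma_0}{\det\Sigma_1}\right]
```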

variational_expectation

variational_expectation(state: ComputationAwareGPState[_LinearSolverState]) -> Float[Array, 'N']

Compute the variational expectation.

Compute the pointwise expected log-likelihood under the variational distribution.

Note

This should be used instead of gpjax.objectives.variational_expectation.

Parameters:

  • state

    (ComputationAwareGPState[_LinearSolverState]) –

    State of the conditioned GP computed by init

Returns:

  • expectation ( Float[Array, N] ) –

    The pointwise expected log-likelihood under the variational distribution.

Source code in src/cagpjax/models/cagp.py
def variational_expectation(
    self, state: ComputationAwareGPState[_LinearSolverState]
) -> Float[Array, "N"]:
    """Compute the variational expectation.

    Compute the pointwise expected log-likelihood under the variational distribution.

    Note:
        This should be used instead of ``gpjax.objectives.variational_expectation``

    Args:
        state: State of the conditioned GP computed by [`init`][..init]

    Returns:
        expectation: The pointwise expected log-likelihood under the variational distribution.
    """

    # Unpack data
    y = state.train_data.y

    # Predict and compute expectation
    qpred = self.predict(state)
    mean = qpred.mean
    variance = qpred.variance
    expectation = self.posterior.likelihood.expected_log_likelihood(
        y, mean[:, None], variance[:, None]
    )

    return expectation
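
For a Gaussian likelihood, the pointwise expected log-likelihood under q(f) = N(μ, v) has the closed form -½ log(2πσ²) - ((y - μ)² + v) / (2σ²). A minimal NumPy sketch under that assumption (the helper name is hypothetical, not this package's API):

```python
import numpy as np

def expected_log_likelihood(y, mean, variance, obs_var):
    """Pointwise E_q[log N(y | f, obs_var)] for q(f) = N(mean, variance)."""
    return (
        -0.5 * np.log(2 * np.pi * obs_var)
        - ((y - mean) ** 2 + variance) / (2 * obs_var)
    )

y = np.array([0.5, -1.0, 2.0])
mean = np.array([0.4, -0.8, 1.5])
variance = np.array([0.1, 0.2, 0.05])
vals = expected_log_likelihood(y, mean, variance, obs_var=0.3)
```

The extra `variance` term in the numerator is what distinguishes this from a plain Gaussian log-density: predictive uncertainty at each point lowers the expected log-likelihood.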

ComputationAwareGPState dataclass

ComputationAwareGPState(train_data: Dataset, actions: LinearOperator, obs_cov_proj: LinearOperator, cov_prior_proj_state: _LinearSolverState, residual_proj: Float[Array, 'M'], repr_weights_proj: Float[Array, 'M'])

Bases: Generic[_LinearSolverState]

Projected quantities for computation-aware GP inference.

Parameters:

  • train_data

    (Dataset) –

Training data consisting of N inputs, each with D dimensions.

  • actions

    (LinearOperator) –

    Actions operator; transpose of operator projecting from N-dimensional space to M-dimensional subspace.

  • obs_cov_proj

    (LinearOperator) –

    Projected covariance of likelihood.

  • cov_prior_proj_state

    (_LinearSolverState) –

    Linear solver state for cov_prior_proj.

  • residual_proj

    (Float[Array, M]) –

    Projected residuals between observations and prior mean.

  • repr_weights_proj

    (Float[Array, M]) –

    Projected representer weights.