Source code for blackjax.util

"""Utility functions for BlackJax."""
from functools import partial
from typing import Callable, Union

import jax.numpy as jnp
from jax import jit, lax
from jax.flatten_util import ravel_pytree
from jax.random import normal, split
from jax.tree_util import tree_leaves

from blackjax.base import Info, SamplingAlgorithm, State, VIAlgorithm
from blackjax.progress_bar import progress_bar_scan
from blackjax.types import Array, ArrayLikeTree, ArrayTree, PRNGKey


@partial(jit, static_argnames=("precision",), inline=True)
[docs] def linear_map(diag_or_dense_a, b, *, precision="highest"): """Perform a linear map of the form y = Ax. Dispatch matrix multiplication to either jnp.dot or jnp.multiply. Unlike jax.numpy.dot, this function output an Array that match the dtype and shape of the 2nd input: - diag_or_dense_a is a scalar or 1d vector, `diag_or_dense_a * b` is returned - diag_or_dense_a is a 2d matrix, `diag_or_dense_a @ b` is returned Note that unlike jax.numpy.dot, here we defaults to full (highest) precision. This is more useful for numerical algorithms and will be the default for jax.numpy in the future: https://github.com/google/jax/pull/7859 Parameters ---------- diag_or_dense_a: A diagonal (1d vector) or dense matrix (2d square matrix). b: A vector. precision: The precision of the computation. See jax.lax.dot_general for more details. Returns ------- The result vector of the matrix multiplication. """ dtype = jnp.result_type(diag_or_dense_a.dtype, b.dtype) diag_or_dense_a = diag_or_dense_a.astype(dtype) b = b.astype(dtype) ndim = jnp.ndim(diag_or_dense_a) if ndim <= 1: return lax.mul(diag_or_dense_a, b) else: return lax.dot(diag_or_dense_a, b, precision=precision)
# TODO(https://github.com/blackjax-devs/blackjax/issues/376) # Refactor this function to not use ravel_pytree might be more performant.
[docs] def generate_gaussian_noise( rng_key: PRNGKey, position: ArrayLikeTree, mu: Union[float, Array] = 0.0, sigma: Union[float, Array] = 1.0, ) -> ArrayTree: """Generate N(mu, sigma) noise with output structure that match a given PyTree. Parameters ---------- rng_key: The pseudo-random number generator key used to generate random numbers. position: PyTree that the structure the output should to match. mu: The mean of the Gaussian distribution. sigma: The standard deviation of the Gaussian distribution. Returns ------- Gaussian noise following N(mu, sigma) that match the structure of position. """ p, unravel_fn = ravel_pytree(position) sample = normal(rng_key, shape=p.shape, dtype=p.dtype) return unravel_fn(mu + linear_map(sigma, sample))
[docs] def generate_unit_vector( rng_key: PRNGKey, position: ArrayLikeTree, ) -> Array: """Generate a random unit vector with output structure that match a given PyTree. Parameters ---------- rng_key: The pseudo-random number generator key used to generate random numbers. position: PyTree that the structure the output should to match. Returns ------- Random unit vector that match the structure of position. """ p, unravel_fn = ravel_pytree(position) sample = normal(rng_key, shape=p.shape, dtype=p.dtype) return unravel_fn(sample / jnp.linalg.norm(sample))
[docs] def pytree_size(pytree: ArrayLikeTree) -> int: """Return the dimension of the flatten PyTree.""" return sum(jnp.size(value) for value in tree_leaves(pytree))
[docs] def index_pytree(input_pytree: ArrayLikeTree) -> ArrayTree: """Builds a PyTree with elements indicating its corresponding index on a flat array. Various algorithms in BlackJAX take as input a 1 or 2 dimensional array which somehow affects the sampling or approximation of a PyTree. For instance, in HMC a 1 or 2 dimensional inverse mass matrix is used when simulating Hamilonian dynamics on PyTree position and momentum variables. It is usually unclear how the elements of the array interact with the PyTree. This function demonstrates how all algorithms map an array to a PyTree of equivalent dimension. The function returns the index of a 1 dimensional array corresponding to each element of the PyTree. This way the user can tell which element in the PyTree corresponds to which column (and row) of a 1 dimensional (or 2 dimensional) array. Parameters ---------- input_pytree: Example PyTree. Returns ------- PyTree mapping each individual element of an arange array to elements in the PyTree. """ flat_input, unravel_fn = ravel_pytree(input_pytree) (dim_input,) = flat_input.shape array = jnp.arange(dim_input, dtype=flat_input.dtype) return unravel_fn(array)
[docs] def run_inference_algorithm( rng_key: PRNGKey, initial_state_or_position: ArrayLikeTree, inference_algorithm: Union[SamplingAlgorithm, VIAlgorithm], num_steps: int, progress_bar: bool = False, transform: Callable = lambda x: x, ) -> tuple[State, State, Info]: """Wrapper to run an inference algorithm. Note that this utility function does not work for Stochastic Gradient MCMC samplers like sghmc, as SG-MCMC samplers require additional control flow for batches of data to be passed in during each sample. Parameters ---------- rng_key The random state used by JAX's random numbers generator. initial_state_or_position The initial state OR the initial position of the inference algorithm. If an initial position is passed in, the function will automatically convert it into an initial state. inference_algorithm One of blackjax's sampling algorithms or variational inference algorithms. num_steps Number of MCMC steps. progress_bar Whether to display a progress bar. transform A transformation of the trace of states to be returned. This is useful for computing determinstic variables, or returning a subset of the states. By default, the states are returned as is. Returns ------- Tuple[State, State, Info] 1. The final state of the inference algorithm. 2. The trace of states of the inference algorithm (contains the MCMC samples). 3. The trace of the info of the inference algorithm for diagnostics. """ init_key, sample_key = split(rng_key, 2) try: initial_state = inference_algorithm.init(initial_state_or_position, init_key) except (TypeError, ValueError, AttributeError): # We assume initial_state is already in the right format. initial_state = initial_state_or_position keys = split(sample_key, num_steps) @jit def _one_step(state, xs): _, rng_key = xs state, info = inference_algorithm.step(rng_key, state) return state, (transform(state), info) if progress_bar: one_step = progress_bar_scan(num_steps)(_one_step) else: one_step = _one_step xs = (jnp.arange(num_steps), keys) final_state, (state_history, info_history) = lax.scan(one_step, initial_state, xs) return final_state, state_history, info_history