-
Notifications
You must be signed in to change notification settings - Fork 107
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Partial posteriors SMC and refactor to decouple tempering from SMC co…
…nstruction (#729) * extracting taking last * test passing * layering * example * more * Adding another example * tests in place * rolling back changes * Adding test for num_mcmc_steps * format * better test coverage * linter * Flake8 * black * implementation[ * partial posteriors implementation * rolling back some changes * linter * fixing test * adding reference * typo * exposing in top level api * reruning precommit * adding more steps * smaller step size * fixes on comments * small fix on formating * renaming to data mask * linter
- Loading branch information
Showing
8 changed files
with
350 additions
and
59 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -6,4 +6,5 @@ | |
"tempered", | ||
"inner_kernel_tuning", | ||
"extend_params", | ||
"partial_posteriors_path", | ||
] |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,64 @@ | ||
from functools import partial | ||
from typing import Callable | ||
|
||
import jax | ||
|
||
from blackjax import smc | ||
from blackjax.smc.base import SMCState, update_and_take_last | ||
from blackjax.types import PRNGKey | ||
|
||
|
||
def build_kernel( | ||
mcmc_step_fn: Callable, | ||
mcmc_init_fn: Callable, | ||
resampling_fn: Callable, | ||
update_strategy: Callable = update_and_take_last, | ||
): | ||
"""SMC step from MCMC kernels. | ||
Builds MCMC kernels from the input parameters, which may change across iterations. | ||
Moreover, it defines the way such kernels are used to update the particles. This layer | ||
adapts an API defined in terms of kernels (mcmc_step_fn and mcmc_init_fn) into an API | ||
that depends on an update function over the set of particles. | ||
Returns | ||
------- | ||
A callable that takes a rng_key and a state with .particles and .weights and returns a base.SMCState | ||
and base.SMCInfo pair. | ||
""" | ||
|
||
def step( | ||
rng_key: PRNGKey, | ||
state, | ||
num_mcmc_steps: int, | ||
mcmc_parameters: dict, | ||
logposterior_fn: Callable, | ||
log_weights_fn: Callable, | ||
) -> tuple[smc.base.SMCState, smc.base.SMCInfo]: | ||
shared_mcmc_parameters = {} | ||
unshared_mcmc_parameters = {} | ||
for k, v in mcmc_parameters.items(): | ||
if v.shape[0] == 1: | ||
shared_mcmc_parameters[k] = v[0, ...] | ||
else: | ||
unshared_mcmc_parameters[k] = v | ||
|
||
shared_mcmc_step_fn = partial(mcmc_step_fn, **shared_mcmc_parameters) | ||
|
||
update_fn, num_resampled = update_strategy( | ||
mcmc_init_fn, | ||
logposterior_fn, | ||
shared_mcmc_step_fn, | ||
n_particles=state.weights.shape[0], | ||
num_mcmc_steps=num_mcmc_steps, | ||
) | ||
|
||
return smc.base.step( | ||
rng_key, | ||
SMCState(state.particles, state.weights, unshared_mcmc_parameters), | ||
update_fn, | ||
jax.vmap(log_weights_fn), | ||
resampling_fn, | ||
num_resampled, | ||
) | ||
|
||
return step |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,127 @@ | ||
from typing import Callable, NamedTuple, Optional, Tuple | ||
|
||
import jax | ||
import jax.numpy as jnp | ||
|
||
from blackjax import SamplingAlgorithm, smc | ||
from blackjax.smc.base import update_and_take_last | ||
from blackjax.smc.from_mcmc import build_kernel as smc_from_mcmc | ||
from blackjax.types import Array, ArrayLikeTree, ArrayTree, PRNGKey | ||
|
||
|
||
class PartialPosteriorsSMCState(NamedTuple): | ||
"""Current state for the tempered SMC algorithm. | ||
particles: PyTree | ||
The particles' positions. | ||
weights: | ||
Weights of the particles, so that they represent a probability distribution | ||
data_mask: | ||
A 1D boolean array to indicate which datapoints to include | ||
in the computation of the observed likelihood. | ||
""" | ||
|
||
particles: ArrayTree | ||
weights: Array | ||
data_mask: Array | ||
|
||
|
||
def init(particles: ArrayLikeTree, num_datapoints: int) -> PartialPosteriorsSMCState: | ||
"""num_datapoints are the number of observations that could potentially be | ||
used in a partial posterior. Since the initial data_mask is all 0s, it | ||
means that no likelihood term will be added (only prior). | ||
""" | ||
num_particles = jax.tree_util.tree_flatten(particles)[0][0].shape[0] | ||
weights = jnp.ones(num_particles) / num_particles | ||
return PartialPosteriorsSMCState(particles, weights, jnp.zeros(num_datapoints)) | ||
|
||
|
||
def build_kernel( | ||
mcmc_step_fn: Callable, | ||
mcmc_init_fn: Callable, | ||
resampling_fn: Callable, | ||
num_mcmc_steps: Optional[int], | ||
mcmc_parameters: ArrayTree, | ||
partial_logposterior_factory: Callable[[Array], Callable], | ||
update_strategy=update_and_take_last, | ||
) -> Callable: | ||
"""Build the Partial Posteriors (data tempering) SMC kernel. | ||
The distribution's trajectory includes increasingly adding more | ||
datapoints to the likelihood. See Section 2.2 of https://arxiv.org/pdf/2007.11936 | ||
Parameters | ||
---------- | ||
mcmc_step_fn | ||
A function that computes the log density of the prior distribution | ||
mcmc_init_fn | ||
A function that returns the probability at a given position. | ||
resampling_fn | ||
A random function that resamples generated particles based of weights | ||
num_mcmc_steps | ||
Number of iterations in the MCMC chain. | ||
mcmc_parameters | ||
A dictionary of parameters to be used by the inner MCMC kernels | ||
partial_logposterior_factory: | ||
A callable that given an array of 0 and 1, returns a function logposterior(x). | ||
The array represents which values to include in the logposterior calculation. The logposterior | ||
must be jax compilable. | ||
Returns | ||
------- | ||
A callable that takes a rng_key and PartialPosteriorsSMCState and selectors for | ||
the current and previous posteriors, and takes a data-tempered SMC state. | ||
""" | ||
delegate = smc_from_mcmc(mcmc_step_fn, mcmc_init_fn, resampling_fn, update_strategy) | ||
|
||
def step( | ||
key, state: PartialPosteriorsSMCState, data_mask: Array | ||
) -> Tuple[PartialPosteriorsSMCState, smc.base.SMCInfo]: | ||
logposterior_fn = partial_logposterior_factory(data_mask) | ||
|
||
previous_logposterior_fn = partial_logposterior_factory(state.data_mask) | ||
|
||
def log_weights_fn(x): | ||
return logposterior_fn(x) - previous_logposterior_fn(x) | ||
|
||
state, info = delegate( | ||
key, state, num_mcmc_steps, mcmc_parameters, logposterior_fn, log_weights_fn | ||
) | ||
|
||
return ( | ||
PartialPosteriorsSMCState(state.particles, state.weights, data_mask), | ||
info, | ||
) | ||
|
||
return step | ||
|
||
|
||
def as_top_level_api( | ||
mcmc_step_fn: Callable, | ||
mcmc_init_fn: Callable, | ||
mcmc_parameters: dict, | ||
resampling_fn: Callable, | ||
num_mcmc_steps, | ||
partial_logposterior_factory: Callable, | ||
update_strategy=update_and_take_last, | ||
) -> SamplingAlgorithm: | ||
"""A factory that wraps the kernel into a SamplingAlgorithm object. | ||
See build_kernel for full documentation on the parameters. | ||
""" | ||
|
||
kernel = build_kernel( | ||
mcmc_step_fn, | ||
mcmc_init_fn, | ||
resampling_fn, | ||
num_mcmc_steps, | ||
mcmc_parameters, | ||
partial_logposterior_factory, | ||
update_strategy, | ||
) | ||
|
||
def init_fn(position: ArrayLikeTree, num_observations, rng_key=None): | ||
del rng_key | ||
return init(position, num_observations) | ||
|
||
def step(key: PRNGKey, state: PartialPosteriorsSMCState, data_mask: Array): | ||
return kernel(key, state, data_mask) | ||
|
||
return SamplingAlgorithm(init_fn, step) # type: ignore[arg-type] |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.
5a25352
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Possible performance regression was detected for benchmark 'Python Benchmark with pytest-benchmark'.
Benchmark result of this commit is worse than the previous benchmark result exceeding threshold
2
.tests/test_benchmarks.py::test_regression_hmc
0.043374788288574655
iter/sec (stddev: 0.04990895128492592
)0.0983662024930494
iter/sec (stddev: 0.12340149282010071
)2.27
This comment was automatically generated by workflow using github-action-benchmark.