From 183fdf902d3baeefb9b824bbde16cddee5ffa8ea Mon Sep 17 00:00:00 2001
From: slamitza
Date: Sun, 21 Jan 2024 17:30:23 +0100
Subject: [PATCH] fixed test

---
 .../experimental/mcmc/particle_filter.py      |  17 +-
 .../experimental/mcmc/particle_filter_test.py | 854 +-----------------
 2 files changed, 20 insertions(+), 851 deletions(-)

diff --git a/tensorflow_probability/python/experimental/mcmc/particle_filter.py b/tensorflow_probability/python/experimental/mcmc/particle_filter.py
index 2322d5a5ec..c5060747ee 100644
--- a/tensorflow_probability/python/experimental/mcmc/particle_filter.py
+++ b/tensorflow_probability/python/experimental/mcmc/particle_filter.py
@@ -446,7 +446,7 @@ def seeded_one_step(seed_state_results, _):
 
 
 def smc_squared(
-    inner_observations,
+    observations,
     initial_parameter_prior,
     num_outer_particles,
     inner_initial_state_prior,
@@ -474,14 +474,14 @@ def smc_squared(
       seed, n=3, salt='smc_squared'
   )
 
-  num_observation_steps = ps.size0(tf.nest.flatten(inner_observations)[0])
+  num_observation_steps = ps.size0(tf.nest.flatten(observations)[0])
 
   # TODO: The following two lines compensate for having the
   # first empty step in smc2
   num_timesteps = (1 + num_transitions_per_observation *
                    (num_observation_steps - 1)) + 1
 
-  last_obs_expanded = tf.expand_dims(inner_observations[-1], axis=0)
-  inner_observations = tf.concat([inner_observations,
+  last_obs_expanded = tf.expand_dims(observations[-1], axis=0)
+  inner_observations = tf.concat([observations,
                                   last_obs_expanded], axis=0)
 
 
@@ -1104,12 +1104,13 @@ def _compute_observation_log_weights(step,
     observation = tf.nest.map_structure(
         lambda x, step=step: tf.gather(x, observation_idx), observations)
 
-    if particles_dim == 1:
-      observation = tf.expand_dims(observation, axis=0)
-      observation = tf.nest.map_structure(
-          lambda x: tf.expand_dims(x, axis=particles_dim), observation)
+    if particles_dim != 1:
+      observation = tf.nest.map_structure(
+          lambda x: tf.expand_dims(x, axis=particles_dim), observation
+      )
 
     log_weights = observation_fn(step, particles).log_prob(observation)
+
     return tf.where(step_has_observation,
                     log_weights,
                     tf.zeros_like(log_weights))
diff --git a/tensorflow_probability/python/experimental/mcmc/particle_filter_test.py b/tensorflow_probability/python/experimental/mcmc/particle_filter_test.py
index 8e9a140999..235ef57237 100644
--- a/tensorflow_probability/python/experimental/mcmc/particle_filter_test.py
+++ b/tensorflow_probability/python/experimental/mcmc/particle_filter_test.py
@@ -41,700 +41,6 @@
 @test_util.test_all_tf_execution_regimes
 class _ParticleFilterTest(test_util.TestCase):
 
-  def test_random_walk(self):
-    initial_state_prior = jdn.JointDistributionNamed(
-        {'position': deterministic.Deterministic(0.)})
-
-    # Biased random walk.
-    def particle_dynamics(_, previous_state):
-      state_shape = ps.shape(previous_state['position'])
-      return jdn.JointDistributionNamed({
-          'position':
-              transformed_distribution.TransformedDistribution(
-                  bernoulli.Bernoulli(
-                      probs=tf.fill(state_shape, 0.75), dtype=self.dtype),
-                  shift.Shift(previous_state['position']))
-      })
-
-    # Completely uninformative observations allowing a test
-    # of the pure dynamics.
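[Editor's note] On the _compute_observation_log_weights hunk above: instead of
special-casing particles_dim == 1, the gathered observation is now expanded at
particles_dim whenever particles_dim != 1, so that log_prob broadcasts one
observation across the particle axis. A minimal sketch of that broadcasting,
using hypothetical shapes (batch shape [3, 2], 1000 particles at the default
particles_dim=0), not the library code itself:

    import tensorflow as tf
    import tensorflow_probability as tfp

    tfd = tfp.distributions

    particles = tf.zeros([1000, 3, 2])   # [num_particles] + batch shape
    observation = tf.ones([3, 2])        # one observation per batch element
    # Expand at particles_dim=0 so log_prob broadcasts over all particles.
    observation = tf.expand_dims(observation, axis=0)  # -> [1, 3, 2]
    log_weights = tfd.Normal(loc=particles, scale=0.1).log_prob(observation)
    print(log_weights.shape)             # (1000, 3, 2)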
- def particle_observations(_, state): - state_shape = ps.shape(state['position']) - return uniform.Uniform( - low=tf.fill(state_shape, -100.), high=tf.fill(state_shape, 100.)) - - observations = tf.zeros((9,), dtype=self.dtype) - trajectories, _ = self.evaluate( - particle_filter.infer_trajectories( - observations=observations, - initial_state_prior=initial_state_prior, - transition_fn=particle_dynamics, - observation_fn=particle_observations, - num_particles=16384, - seed=test_util.test_seed())) - position = trajectories['position'] - - # The trajectories have the following properties: - # 1. they lie completely in the range [0, 8] - self.assertAllInRange(position, 0., 8.) - # 2. each step lies in the range [0, 1] - self.assertAllInRange(position[1:] - position[:-1], 0., 1.) - # 3. the expectation and variance of the final positions are 6 and 1.5. - self.assertAllClose(tf.reduce_mean(position[-1]), 6., atol=0.1) - self.assertAllClose(tf.math.reduce_variance(position[-1]), 1.5, atol=0.1) - - def test_batch_of_filters(self): - - batch_shape = [3, 2] - num_particles = 1000 - num_timesteps = 40 - - # Batch of priors on object 1D positions and velocities. - initial_state_prior = jdn.JointDistributionNamed({ - 'position': normal.Normal(loc=0., scale=tf.ones(batch_shape)), - 'velocity': normal.Normal(loc=0., scale=tf.ones(batch_shape) * 0.1) - }) - - def transition_fn(_, previous_state): - return jdn.JointDistributionNamed({ - 'position': - normal.Normal( - loc=previous_state['position'] + previous_state['velocity'], - scale=0.1), - 'velocity': - normal.Normal(loc=previous_state['velocity'], scale=0.01) - }) - - def observation_fn(_, state): - return normal.Normal(loc=state['position'], scale=0.1) - - # Batch of synthetic observations, . - true_initial_positions = np.random.randn(*batch_shape).astype(self.dtype) - true_velocities = 0.1 * np.random.randn( - *batch_shape).astype(self.dtype) - observed_positions = ( - true_velocities * - np.arange(num_timesteps).astype( - self.dtype)[..., tf.newaxis, tf.newaxis] + - true_initial_positions) - - (particles, log_weights, parent_indices, - incremental_log_marginal_likelihoods) = self.evaluate( - particle_filter.particle_filter( - observations=observed_positions, - initial_state_prior=initial_state_prior, - transition_fn=transition_fn, - observation_fn=observation_fn, - num_particles=num_particles, - seed=test_util.test_seed())) - - self.assertAllEqual(particles['position'].shape, - [num_timesteps, num_particles] + batch_shape) - self.assertAllEqual(particles['velocity'].shape, - [num_timesteps, num_particles] + batch_shape) - self.assertAllEqual(parent_indices.shape, - [num_timesteps, num_particles] + batch_shape) - self.assertAllEqual(incremental_log_marginal_likelihoods.shape, - [num_timesteps] + batch_shape) - - self.assertAllClose( - self.evaluate( - tf.reduce_sum(tf.exp(log_weights) * - particles['position'], axis=1)), - observed_positions, - atol=0.1) - - velocity_means = tf.reduce_sum(tf.exp(log_weights) * - particles['velocity'], axis=1) - self.assertAllClose( - self.evaluate(tf.reduce_mean(velocity_means, axis=0)), - true_velocities, atol=0.05) - - # Uncertainty in velocity should decrease over time. - velocity_stddev = self.evaluate( - tf.math.reduce_std(particles['velocity'], axis=1)) - self.assertAllLess((velocity_stddev[-1] - velocity_stddev[0]), 0.) 
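[Editor's note] The assertions above recover posterior moments by
self-normalized importance averaging: the per-step log_weights are normalized,
so a weighted sum over the particle axis estimates the posterior mean. A small
NumPy sketch with hypothetical sizes (4 particles, batch shape [3, 2]):

    import numpy as np

    log_weights = np.log(np.full([4, 3, 2], 0.25))  # uniform, normalized
    particles = np.random.randn(4, 3, 2)
    # The particle axis is 0 here; in the test it is axis 1, after time.
    posterior_mean = np.sum(np.exp(log_weights) * particles, axis=0)
    print(posterior_mean.shape)                     # (3, 2)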
- - trajectories = self.evaluate( - particle_filter.reconstruct_trajectories(particles, parent_indices)) - self.assertAllEqual([num_timesteps, num_particles] + batch_shape, - trajectories['position'].shape) - self.assertAllEqual([num_timesteps, num_particles] + batch_shape, - trajectories['velocity'].shape) - - # Verify that `infer_trajectories` also works on batches. - trajectories, incremental_log_marginal_likelihoods = self.evaluate( - particle_filter.infer_trajectories( - observations=observed_positions, - initial_state_prior=initial_state_prior, - transition_fn=transition_fn, - observation_fn=observation_fn, - num_particles=num_particles, - seed=test_util.test_seed())) - self.assertAllEqual([num_timesteps, num_particles] + batch_shape, - trajectories['position'].shape) - self.assertAllEqual([num_timesteps, num_particles] + batch_shape, - trajectories['velocity'].shape) - self.assertAllEqual(incremental_log_marginal_likelihoods.shape, - [num_timesteps] + batch_shape) - - def test_batch_of_filters_particles_dim_1(self): - - batch_shape = [3, 2] - num_particles = 1000 - num_timesteps = 40 - - # Batch of priors on object 1D positions and velocities. - initial_state_prior = jdn.JointDistributionNamed({ - 'position': normal.Normal(loc=0., scale=tf.ones(batch_shape)), - 'velocity': normal.Normal(loc=0., scale=tf.ones(batch_shape) * 0.1) - }) - - def transition_fn(_, previous_state): - return jdn.JointDistributionNamed({ - 'position': - normal.Normal( - loc=previous_state['position'] + previous_state['velocity'], - scale=0.1), - 'velocity': - normal.Normal(loc=previous_state['velocity'], scale=0.01) - }) - - def observation_fn(_, state): - return normal.Normal(loc=state['position'], scale=0.1) - - # Batch of synthetic observations, . - true_initial_positions = np.random.randn(*batch_shape).astype(self.dtype) - true_velocities = 0.1 * np.random.randn( - *batch_shape).astype(self.dtype) - observed_positions = ( - true_velocities * - np.arange(num_timesteps).astype( - self.dtype)[..., tf.newaxis, tf.newaxis] + - true_initial_positions) - - (particles, log_weights, parent_indices, - incremental_log_marginal_likelihoods) = self.evaluate( - particle_filter.particle_filter( - observations=observed_positions, - initial_state_prior=initial_state_prior, - transition_fn=transition_fn, - observation_fn=observation_fn, - num_particles=num_particles, - seed=test_util.test_seed(), - particles_dim=1)) - - self.assertAllEqual(particles['position'].shape, - [num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]]) - self.assertAllEqual(particles['velocity'].shape, - [num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]]) - self.assertAllEqual(parent_indices.shape, - [num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]]) - self.assertAllEqual(incremental_log_marginal_likelihoods.shape, - [num_timesteps] + batch_shape) - - self.assertAllClose( - self.evaluate( - tf.reduce_sum(tf.exp(log_weights) * - particles['position'], axis=2)), - observed_positions, - atol=0.3) - - velocity_means = tf.reduce_sum(tf.exp(log_weights) * - particles['velocity'], axis=2) - - self.assertAllClose( - self.evaluate(tf.reduce_mean(velocity_means, axis=0)), - true_velocities, atol=0.05) - - # Uncertainty in velocity should decrease over time. - velocity_stddev = self.evaluate( - tf.math.reduce_std(particles['velocity'], axis=2)) - self.assertAllLess((velocity_stddev[-1] - velocity_stddev[0]), 0.) 
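[Editor's note] With particles_dim=1, the particle axis sits between the two
batch axes, so traced tensors take shape [num_timesteps, batch[0],
num_particles, batch[1]] and the weighted reductions above move from axis=1 to
axis=2. A shape-only sketch with the sizes used in this test:

    import tensorflow as tf

    num_timesteps, b0, num_particles, b1 = 40, 3, 1000, 2
    log_weights = tf.fill([num_timesteps, b0, num_particles, b1],
                          -tf.math.log(float(num_particles)))
    particles = tf.zeros([num_timesteps, b0, num_particles, b1])
    means = tf.reduce_sum(tf.exp(log_weights) * particles, axis=2)
    print(means.shape)  # (40, 3, 2)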
- - trajectories = self.evaluate( - particle_filter.reconstruct_trajectories(particles, - parent_indices, - particles_dim=1)) - self.assertAllEqual([num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]], - trajectories['position'].shape) - self.assertAllEqual([num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]], - trajectories['velocity'].shape) - - # Verify that `infer_trajectories` also works on batches. - trajectories, incremental_log_marginal_likelihoods = self.evaluate( - particle_filter.infer_trajectories( - observations=observed_positions, - initial_state_prior=initial_state_prior, - transition_fn=transition_fn, - observation_fn=observation_fn, - num_particles=num_particles, - particles_dim=1, - seed=test_util.test_seed())) - - self.assertAllEqual([num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]], - trajectories['position'].shape) - self.assertAllEqual([num_timesteps, - batch_shape[0], - num_particles, - batch_shape[1]], - trajectories['velocity'].shape) - self.assertAllEqual(incremental_log_marginal_likelihoods.shape, - [num_timesteps] + batch_shape) - - def test_reconstruct_trajectories_toy_example(self): - particles = tf.convert_to_tensor([[1, 2, 3], [4, 5, 6,], [7, 8, 9]]) - # 1 -- 4 -- 7 - # 2 \/ 5 .- 8 - # 3 /\ 6 /-- 9 - parent_indices = tf.convert_to_tensor([[0, 1, 2], [0, 2, 1], [0, 2, 2]]) - - trajectories = self.evaluate( - particle_filter.reconstruct_trajectories(particles, parent_indices)) - self.assertAllEqual( - np.array([[1, 2, 2], [4, 6, 6], [7, 8, 9]]), trajectories) - - def test_epidemiological_model(self): - # A toy, discrete version of an SIR (Susceptible, Infected, Recovered) - # model (https://en.wikipedia.org/wiki/Compartmental_models_in_epidemiology) - - population_size = 1000 - infection_rate = tf.convert_to_tensor(1.1) - infectious_period = tf.convert_to_tensor(8.0) - - initial_state_prior = jdn.JointDistributionNamed({ - 'susceptible': deterministic.Deterministic(999.), - 'infected': deterministic.Deterministic(1.), - 'new_infections': deterministic.Deterministic(1.), - 'new_recoveries': deterministic.Deterministic(0.) - }) - - # Dynamics model: new infections and recoveries are given by the SIR - # model with Poisson noise. - def infection_dynamics(_, previous_state): - new_infections = poisson.Poisson( - infection_rate * previous_state['infected'] * - previous_state['susceptible'] / population_size) - new_recoveries = poisson.Poisson(previous_state['infected'] / - infectious_period) - - def susceptible(new_infections): - return deterministic.Deterministic( - ps.maximum(0., previous_state['susceptible'] - new_infections)) - - def infected(new_infections, new_recoveries): - return deterministic.Deterministic( - ps.maximum( - 0., - previous_state['infected'] + new_infections - new_recoveries)) - - return jdn.JointDistributionNamed({ - 'new_infections': new_infections, - 'new_recoveries': new_recoveries, - 'susceptible': susceptible, - 'infected': infected - }) - - # Observation model: each day we detect new cases, noisily. 
- def infection_observations(_, state): - return poisson.Poisson(state['infected']) - - # pylint: disable=bad-whitespace - observations = tf.convert_to_tensor([ - 0., 4., 1., 5., 23., 27., 75., 127., 248., 384., 540., 683., - 714., 611., 561., 493., 385., 348., 300., 277., 249., 219., 216., 174., - 132., 122., 115., 99., 76., 84., 77., 56., 42., 56., 46., 38., - 34., 44., 25., 27.]) - # pylint: enable=bad-whitespace - - trajectories, _ = self.evaluate( - particle_filter.infer_trajectories( - observations=observations, - initial_state_prior=initial_state_prior, - transition_fn=infection_dynamics, - observation_fn=infection_observations, - num_particles=100, - seed=test_util.test_seed())) - - # The susceptible population should decrease over time. - self.assertAllLessEqual( - trajectories['susceptible'][1:, ...] - - trajectories['susceptible'][:-1, ...], - 0.0) - - def test_data_driven_proposal(self): - - num_particles = 100 - observations = tf.convert_to_tensor([60., -179.2, 1337.42]) - - # Define a system constrained primarily by observations, where proposing - # from the dynamics would be a bad fit. - initial_state_prior = normal.Normal(loc=0., scale=1e6) - transition_fn = ( - lambda _, previous_state: normal.Normal(loc=previous_state, scale=1e6)) - observation_fn = lambda _, state: normal.Normal(loc=state, scale=0.1) - initial_state_proposal = normal.Normal(loc=observations[0], scale=0.1) - proposal_fn = ( - lambda step, state: normal.Normal( # pylint: disable=g-long-lambda - loc=tf.ones_like(state) * observations[step + 1], - scale=1.0)) - - trajectories, _ = self.evaluate( - particle_filter.infer_trajectories( - observations=observations, - initial_state_prior=initial_state_prior, - transition_fn=transition_fn, - observation_fn=observation_fn, - num_particles=num_particles, - initial_state_proposal=initial_state_proposal, - proposal_fn=proposal_fn, - seed=test_util.test_seed())) - self.assertAllClose(trajectories, - tf.convert_to_tensor( - tf.convert_to_tensor( - observations)[..., tf.newaxis] * - tf.ones([num_particles])), atol=1.0) - - def test_estimated_prob_approximates_true_prob(self): - - # Draw simulated data from a 2D linear Gaussian system. - initial_state_prior = mvn_diag.MultivariateNormalDiag( - loc=0., scale_diag=(1., 1.)) - transition_matrix = tf.convert_to_tensor([[1., -0.5], [0.4, -1.]]) - transition_noise = mvn_tril.MultivariateNormalTriL( - loc=1., scale_tril=tf.convert_to_tensor([[0.3, 0], [-0.1, 0.2]])) - observation_matrix = tf.convert_to_tensor([[0.1, 1.], [1., 0.2]]) - observation_noise = mvn_tril.MultivariateNormalTriL( - loc=-0.3, scale_tril=tf.convert_to_tensor([[0.5, 0], [0.1, 0.5]])) - model = lgssm.LinearGaussianStateSpaceModel( - num_timesteps=20, - initial_state_prior=initial_state_prior, - transition_matrix=transition_matrix, - transition_noise=transition_noise, - observation_matrix=observation_matrix, - observation_noise=observation_noise) - observations = self.evaluate( - model.sample(seed=test_util.test_seed())) - (lps, filtered_means, - _, _, _, _, _) = self.evaluate(model.forward_filter(observations)) - - # Approximate the filtering means and marginal likelihood(s) using - # the particle filter. - # pylint: disable=g-long-lambda - (particles, log_weights, _, - estimated_incremental_log_marginal_likelihoods) = self.evaluate( - particle_filter.particle_filter( - observations=observations, - initial_state_prior=initial_state_prior, - transition_fn=lambda _, previous_state: mvn_tril. 
- MultivariateNormalTriL( - loc=transition_noise.loc + tf.linalg.matvec( - transition_matrix, previous_state), - scale_tril=transition_noise.scale_tril), - observation_fn=lambda _, state: mvn_tril.MultivariateNormalTriL( - loc=observation_noise.loc + tf.linalg.matvec( - observation_matrix, state), - scale_tril=observation_noise.scale_tril), - num_particles=1024, - seed=test_util.test_seed())) - # pylint: enable=g-long-lambda - - particle_means = np.sum( - particles * np.exp(log_weights)[..., np.newaxis], axis=1) - self.assertAllClose(filtered_means, particle_means, atol=0.1, rtol=0.1) - - self.assertAllClose( - lps, estimated_incremental_log_marginal_likelihoods, atol=0.6) - - def test_proposal_weights_dont_affect_marginal_likelihood(self): - observation = np.array([-1.3, 0.7]).astype(self.dtype) - # This particle filter has proposals different from the dynamics, - # so internally it will use proposal weights in addition to observation - # weights. It should still get the observation likelihood correct. - _, lps = self.evaluate( - particle_filter.infer_trajectories( - observation, - initial_state_prior=normal.Normal(loc=0., scale=1.), - transition_fn=lambda _, x: normal.Normal(loc=x, scale=1.), - observation_fn=lambda _, x: normal.Normal(loc=x, scale=1.), - initial_state_proposal=normal.Normal(loc=0., scale=5.), - proposal_fn=lambda _, x: normal.Normal(loc=x, scale=5.), - num_particles=2048, - seed=test_util.test_seed())) - - # Compare marginal likelihood against that - # from the true (jointly normal) marginal distribution. - y1_marginal_dist = normal.Normal(loc=0., scale=np.sqrt(1. + 1.)) - y2_conditional_dist = ( - lambda y1: normal.Normal(loc=y1 / 2., scale=np.sqrt(5. / 2.))) - true_lps = tf.stack( - [y1_marginal_dist.log_prob(observation[0]), - y2_conditional_dist(observation[0]).log_prob(observation[1])], - axis=0) - # The following line passes at atol = 0.01 if num_particles = 32768. - self.assertAllClose(true_lps, lps, atol=0.2) - - def test_can_step_dynamics_faster_than_observations(self): - initial_state_prior = jdn.JointDistributionNamed({ - 'position': deterministic.Deterministic(1.), - 'velocity': deterministic.Deterministic(0.) - }) - - # Use 100 steps between observations to integrate a simple harmonic - # oscillator. - dt = 0.01 - def simple_harmonic_motion_transition_fn(_, state): - return jdn.JointDistributionNamed({ - 'position': - normal.Normal( - loc=state['position'] + dt * state['velocity'], - scale=dt * 0.01), - 'velocity': - normal.Normal( - loc=state['velocity'] - dt * state['position'], - scale=dt * 0.01) - }) - - def observe_position(_, state): - return normal.Normal(loc=state['position'], scale=0.01) - - particles, _, _, lps = self.evaluate( - particle_filter.particle_filter( - # 'Observing' the values we'd expect from a proper integrator should - # give high likelihood if our discrete approximation is good. - observations=tf.convert_to_tensor( - [tf.math.cos(0.), tf.math.cos(1.)]), - initial_state_prior=initial_state_prior, - transition_fn=simple_harmonic_motion_transition_fn, - observation_fn=observe_position, - num_particles=1024, - num_transitions_per_observation=100, - seed=test_util.test_seed())) - - self.assertLen(particles['position'], 101) - self.assertAllClose(np.mean(particles['position'], axis=-1), - tf.math.cos(dt * np.arange(101)), - atol=0.04) - self.assertLen(lps, 101) - self.assertGreater(lps[0], 3.) - self.assertGreater(lps[-1], 3.) 
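[Editor's note] The 101 traced steps asserted above follow from the step count
used by particle_filter: one initial step plus num_transitions_per_observation
transitions for each observation after the first. The smc_squared hunk at the
top of this patch pads one extra (empty) initial step, which is why the deleted
smc_squared variant of this test further below asserts 102. A quick check:

    def num_steps(num_observations, num_transitions_per_observation=1):
      return 1 + num_transitions_per_observation * (num_observations - 1)

    print(num_steps(2, 100))      # 101, as asserted above
    print(num_steps(2, 100) + 1)  # 102, with smc_squared's padded first step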
- - def test_custom_trace_fn(self): - - def trace_fn(state, _): - # Traces the mean and stddev of the particle population at each step. - weights = tf.exp(state.log_weights) - mean = tf.reduce_sum(weights * state.particles, axis=0) - variance = tf.reduce_sum( - weights * (state.particles - mean[tf.newaxis, ...])**2) - return {'mean': mean, - 'stddev': tf.sqrt(variance), - # In real usage we would likely not track the particles and - # weights. We keep them here just so we can double-check the - # stats, below. - 'particles': state.particles, - 'weights': weights} - - results = self.evaluate( - particle_filter.particle_filter( - observations=tf.convert_to_tensor([1., 3., 5., 7., 9.]), - initial_state_prior=normal.Normal(0., 1.), - transition_fn=lambda _, state: normal.Normal(state, 1.), - observation_fn=lambda _, state: normal.Normal(state, 1.), - num_particles=1024, - trace_fn=trace_fn, - seed=test_util.test_seed())) - - # Verify that posterior means are increasing. - self.assertAllGreater(results['mean'][1:] - results['mean'][:-1], 0.) - - # Check that our traced means and scales match values computed - # by averaging over particles after the fact. - all_means = self.evaluate(tf.reduce_sum( - results['weights'] * results['particles'], axis=1)) - all_variances = self.evaluate( - tf.reduce_sum( - results['weights'] * - (results['particles'] - all_means[..., tf.newaxis])**2, - axis=1)) - self.assertAllClose(results['mean'], all_means) - self.assertAllClose(results['stddev'], np.sqrt(all_variances)) - - def test_step_indices_to_trace(self): - num_particles = 1024 - (particles_1_3, log_weights_1_3, parent_indices_1_3, - incremental_log_marginal_likelihood_1_3) = self.evaluate( - particle_filter.particle_filter( - observations=tf.convert_to_tensor([1., 3., 5., 7., 9.]), - initial_state_prior=normal.Normal(0., 1.), - transition_fn=lambda _, state: normal.Normal(state, 10.), - observation_fn=lambda _, state: normal.Normal(state, 0.1), - num_particles=num_particles, - trace_criterion_fn=lambda s, r: ps.logical_or( # pylint: disable=g-long-lambda - ps.equal(r.steps, 2), ps.equal(r.steps, 4)), - static_trace_allocation_size=2, - seed=test_util.test_seed())) - self.assertLen(particles_1_3, 2) - self.assertLen(log_weights_1_3, 2) - self.assertLen(parent_indices_1_3, 2) - self.assertLen(incremental_log_marginal_likelihood_1_3, 2) - means = np.sum(np.exp(log_weights_1_3) * particles_1_3, axis=1) - self.assertAllClose(means, [3., 7.], atol=1.) - - (final_particles, final_log_weights, final_cumulative_lp) = self.evaluate( - particle_filter.particle_filter( - observations=tf.convert_to_tensor([1., 3., 5., 7., 9.]), - initial_state_prior=normal.Normal(0., 1.), - transition_fn=lambda _, state: normal.Normal(state, 10.), - observation_fn=lambda _, state: normal.Normal(state, 0.1), - num_particles=num_particles, - trace_fn=lambda s, r: ( # pylint: disable=g-long-lambda - s.particles, - s.log_weights, - r.accumulated_log_marginal_likelihood), - trace_criterion_fn=None, - seed=test_util.test_seed())) - self.assertLen(final_particles, num_particles) - self.assertLen(final_log_weights, num_particles) - self.assertEqual(final_cumulative_lp.shape, ()) - means = np.sum(np.exp(final_log_weights) * final_particles) - self.assertAllClose(means, 9., atol=1.5) - - def test_warns_if_transition_distribution_has_unexpected_shape(self): - - initial_state_prior = jdab.JointDistributionNamedAutoBatched({ - 'sales': deterministic.Deterministic(0.), - 'inventory': deterministic.Deterministic(1000.) 
- }) - - # Inventory decreases by a Poisson RV 'sales', but is lower bounded at zero. - def valid_transition_fn(_, particles): - return jdab.JointDistributionNamedAutoBatched( - { - 'sales': - poisson.Poisson(10. * tf.ones_like(particles['inventory'])), - 'inventory': - lambda sales: deterministic.Deterministic( # pylint: disable=g-long-lambda - tf.maximum(0., particles['inventory'] - sales)) - }, - batch_ndims=1, - validate_args=True) - - def dummy_observation_fn(_, state): - return normal.Normal(state['inventory'], 1000.) - - run_filter = functools.partial( - particle_filter.particle_filter, - observations=tf.zeros([10]), - initial_state_prior=initial_state_prior, - observation_fn=dummy_observation_fn, - num_particles=3, - seed=test_util.test_seed(sampler_type='stateless')) - - # Check that the model runs as written. - self.evaluate(run_filter(transition_fn=valid_transition_fn)) - self.evaluate(run_filter(transition_fn=valid_transition_fn, - proposal_fn=valid_transition_fn)) - - # Check that broken transition functions raise exceptions. - def transition_fn_broadcasts_over_particles(_, particles): - return jdn.JointDistributionNamed( - { - 'sales': - poisson.Poisson(10. - ), # Proposes same value for all particles. - 'inventory': - lambda sales: deterministic.Deterministic( # pylint: disable=g-long-lambda - tf.maximum(0., particles['inventory'] - sales)) - }, - validate_args=True) - - def transition_fn_partial_batch_shape(_, particles): - return jdn.JointDistributionNamed( - # Using `Sample` ensures iid proposals for each particle, but not - # per-particle log probs. - { - 'sales': - sample_dist_lib.Sample( - poisson.Poisson(10.), ps.shape(particles['sales'])), - 'inventory': - lambda sales: deterministic.Deterministic( # pylint: disable=g-long-lambda - tf.maximum(0., particles['inventory'] - sales)) - }, - validate_args=True) - - def transition_fn_no_batch_shape(_, particles): - # Autobatched JD defaults to treating num_particles as event shape, but - # we need it to be batch shape to get per-particle logprobs. - return jdab.JointDistributionNamedAutoBatched( - { - 'sales': - poisson.Poisson(10. 
* tf.ones_like(particles['inventory'])), - 'inventory': - lambda sales: deterministic.Deterministic( # pylint: disable=g-long-lambda - tf.maximum(0., particles['inventory'] - sales)) - }, - validate_args=True) - - with self.assertRaisesRegex(ValueError, 'transition distribution'): - self.evaluate( - run_filter(transition_fn=transition_fn_broadcasts_over_particles)) - with self.assertRaisesRegex(ValueError, 'transition distribution'): - self.evaluate( - run_filter(transition_fn=transition_fn_partial_batch_shape)) - with self.assertRaisesRegex(ValueError, 'transition distribution'): - self.evaluate( - run_filter(transition_fn=transition_fn_no_batch_shape)) - - with self.assertRaisesRegex(ValueError, 'proposal distribution'): - self.evaluate( - run_filter(transition_fn=valid_transition_fn, - proposal_fn=transition_fn_partial_batch_shape)) - with self.assertRaisesRegex(ValueError, 'proposal distribution'): - self.evaluate( - run_filter(transition_fn=valid_transition_fn, - proposal_fn=transition_fn_broadcasts_over_particles)) - - with self.assertRaisesRegex(ValueError, 'proposal distribution'): - self.evaluate( - run_filter(transition_fn=valid_transition_fn, - proposal_fn=transition_fn_no_batch_shape)) - - @test_util.jax_disable_test_missing_functionality('Gradient of while_loop.') - def test_marginal_likelihood_gradients_are_defined(self): - - def marginal_log_likelihood(level_scale, noise_scale): - _, _, _, lps = particle_filter.particle_filter( - observations=tf.convert_to_tensor([1., 2., 3., 4., 5.]), - initial_state_prior=normal.Normal(loc=0, scale=1.), - transition_fn=lambda _, x: normal.Normal(loc=x, scale=level_scale), - observation_fn=lambda _, x: normal.Normal(loc=x, scale=noise_scale), - num_particles=4, - seed=test_util.test_seed()) - return tf.reduce_sum(lps) - - _, grads = gradient.value_and_gradient(marginal_log_likelihood, 1.0, 1.0) - self.assertAllNotNone(grads) - self.assertAllAssertsNested(self.assertNotAllZero, grads) - def test_smc_squared_rejuvenation_parameters(self): def particle_dynamics(params, _, previous_state): reshaped_params = tf.reshape(params, @@ -742,7 +48,12 @@ def particle_dynamics(params, _, previous_state): [1] * (previous_state.shape.rank - 1)) broadcasted_params = tf.broadcast_to(reshaped_params, previous_state.shape) - return normal.Normal(previous_state + broadcasted_params + 1, 0.1) + reshaped_dist = independent.Independent( + normal.Normal(previous_state + broadcasted_params + 1, 0.1), + reinterpreted_batch_ndims=1 + ) + + return reshaped_dist def rejuvenation_criterion(step, state): # Rejuvenation every 2 steps @@ -753,7 +64,8 @@ def rejuvenation_criterion(step, state): return tf.cond(cond, lambda: tf.constant(True), lambda: tf.constant(False)) - inner_observations = tf.range(30, dtype=tf.float32) + observations = tf.stack([tf.range(30, dtype=tf.float32), + tf.range(30, dtype=tf.float32)], axis=1) num_outer_particles = 3 num_inner_particles = 7 @@ -762,7 +74,7 @@ def rejuvenation_criterion(step, state): scale_diag = tf.broadcast_to([0.05, 0.05], [num_outer_particles, 2]) params, _ = self.evaluate(particle_filter.smc_squared( - inner_observations=inner_observations, + observations=observations, inner_initial_state_prior=lambda _, params: mvn_diag.MultivariateNormalDiag( loc=loc, scale_diag=scale_diag @@ -771,10 +83,8 @@ def rejuvenation_criterion(step, state): num_outer_particles=num_outer_particles, num_inner_particles=num_inner_particles, outer_rejuvenation_criterion_fn=rejuvenation_criterion, - inner_transition_fn=lambda params: ( - lambda _, 
state: independent.Independent( - particle_dynamics(params, _, state), 1) - ), + inner_transition_fn=lambda params: + lambda _, state: particle_dynamics(params, _, state), inner_observation_fn=lambda params: ( lambda _, state: independent.Independent( normal.Normal(state, 2.), 1) @@ -794,148 +104,6 @@ def rejuvenation_criterion(step, state): self.assertAllTrue(mask_parameters) - def test_smc_squared_can_step_dynamics_faster_than_observations(self): - initial_state_prior = jdn.JointDistributionNamed({ - 'position': deterministic.Deterministic([1.]), - 'velocity': deterministic.Deterministic([0.]) - }) - - # Use 100 steps between observations to integrate a simple harmonic - # oscillator. - dt = 0.01 - def simple_harmonic_motion_transition_fn(_, state): - return jdn.JointDistributionNamed({ - 'position': - normal.Normal( - loc=state['position'] + dt * state['velocity'], - scale=dt * 0.01), - 'velocity': - normal.Normal( - loc=state['velocity'] - dt * state['position'], - scale=dt * 0.01) - }) - - def observe_position(_, state): - return normal.Normal(loc=state['position'], scale=0.01) - - particles, lps = self.evaluate(particle_filter.smc_squared( - inner_observations=tf.convert_to_tensor( - [tf.math.cos(0.), tf.math.cos(1.)]), - inner_initial_state_prior=lambda _, params: initial_state_prior, - initial_parameter_prior=deterministic.Deterministic(0.), - num_outer_particles=1, - inner_transition_fn=lambda params: - simple_harmonic_motion_transition_fn, - inner_observation_fn=lambda params: observe_position, - num_inner_particles=1024, - outer_trace_fn=lambda s, r: ( - s.particles[1].particles, - s.particles[3] - ), - num_transitions_per_observation=100, - seed=test_util.test_seed()) - ) - - self.assertAllEqual(ps.shape(particles['position']), tf.constant([102, - 1, - 1024])) - - self.assertAllClose(tf.transpose(np.mean(particles['position'], axis=-1)), - tf.reshape(tf.math.cos(dt * np.arange(102)), [1, -1]), - atol=0.04) - - self.assertAllEqual(ps.shape(lps), [102, 1]) - self.assertGreater(lps[1][0], 1.) - self.assertGreater(lps[-1][0], 3.) - - def test_smc_squared_custom_outer_trace_fn(self): - def trace_fn(state, _): - # Traces the mean and stddev of the particle population at each step. - weights = tf.exp(state[0][1].log_weights[0]) - mean = tf.reduce_sum(weights * state[0][1].particles[0], axis=0) - variance = tf.reduce_sum( - weights * (state[0][1].particles[0] - mean[tf.newaxis, ...]) ** 2) - return {'mean': mean, - 'stddev': tf.sqrt(variance), - # In real usage we would likely not track the particles and - # weights. We keep them here just so we can double-check the - # stats, below. - 'particles': state[0][1].particles[0], - 'weights': weights} - - results = self.evaluate(particle_filter.smc_squared( - inner_observations=tf.convert_to_tensor([1., 3., 5., 7., 9.]), - inner_initial_state_prior=lambda _, params: normal.Normal([0.], 1.), - initial_parameter_prior=deterministic.Deterministic(0.), - inner_transition_fn=lambda params: (lambda _, state: - normal.Normal(state, 1.)), - inner_observation_fn=lambda params: (lambda _, state: - normal.Normal(state, 1.)), - num_inner_particles=1024, - num_outer_particles=1, - outer_trace_fn=trace_fn, - seed=test_util.test_seed()) - ) - - # Verify that posterior means are increasing. - self.assertAllGreater(results['mean'][1:] - results['mean'][:-1], 0.) - - # Check that our traced means and scales match values computed - # by averaging over particles after the fact. 
- all_means = self.evaluate(tf.reduce_sum( - results['weights'] * results['particles'], axis=1)) - all_variances = self.evaluate( - tf.reduce_sum( - results['weights'] * - (results['particles'] - all_means[..., tf.newaxis])**2, - axis=1)) - self.assertAllClose(results['mean'], all_means) - self.assertAllClose(results['stddev'], np.sqrt(all_variances)) - - def test_smc_squared_indices_to_trace(self): - num_outer_particles = 7 - num_inner_particles = 13 - - def rejuvenation_criterion(step, state): - # Rejuvenation every 3 steps - cond = tf.logical_and( - tf.equal(tf.math.mod(step, tf.constant(3)), tf.constant(0)), - tf.not_equal(state.extra[0], tf.constant(0)) - ) - return tf.cond(cond, lambda: tf.constant(True), - lambda: tf.constant(False)) - - (parameters, weight_parameters, - inner_particles, inner_log_weights, lp) = self.evaluate( - particle_filter.smc_squared( - inner_observations=tf.convert_to_tensor([1., 3., 5., 7., 9.]), - initial_parameter_prior=deterministic.Deterministic(0.), - inner_initial_state_prior=lambda _, params: normal.Normal( - [0.] * num_outer_particles, 1. - ), - inner_transition_fn=lambda params: - (lambda _, state: normal.Normal(state, 10.)), - inner_observation_fn=lambda params: - (lambda _, state: normal.Normal(state, 0.1)), - num_inner_particles=num_inner_particles, - num_outer_particles=num_outer_particles, - outer_rejuvenation_criterion_fn=rejuvenation_criterion, - outer_trace_fn=lambda s, r: ( # pylint: disable=g-long-lambda - s.particles[0], - s.log_weights, - s.particles[1].particles, - s.particles[1].log_weights, - r.accumulated_log_marginal_likelihood), - seed=test_util.test_seed()) - ) - - # TODO: smc_squared at the moment starts his run with an empty step - self.assertAllEqual(ps.shape(parameters), [6, 7]) - self.assertAllEqual(ps.shape(weight_parameters), [6, 7]) - self.assertAllEqual(ps.shape(inner_particles), [6, 7, 13]) - self.assertAllEqual(ps.shape(inner_log_weights), [6, 7, 13]) - self.assertAllEqual(ps.shape(lp), [6]) - # TODO(b/186068104): add tests with dynamic shapes. class ParticleFilterTestFloat32(_ParticleFilterTest):
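[Editor's note] The shape assertions in the deleted
test_smc_squared_indices_to_trace above follow the same bookkeeping: 5
observations plus the empty initial step give 6 traced steps, with 7 outer and
13 inner particles. A standalone check of that arithmetic:

    num_obs, num_outer, num_inner = 5, 7, 13
    steps = num_obs + 1  # empty first step, per the TODOs above
    assert (steps, num_outer) == (6, 7)                 # params and weights
    assert (steps, num_outer, num_inner) == (6, 7, 13)  # inner particles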