Variational inference with PyMC (#1306)
* variational inference fit

* remove variational from sample

* make pymc object accessible

* save as McmcPtResult

* tests added

* add warning in write_result()
arrjon committed May 21, 2024
1 parent 7fe40ba commit fefefd5
Showing 6 changed files with 420 additions and 0 deletions.
6 changes: 6 additions & 0 deletions pypesto/store/save_to_hdf5.py
@@ -316,3 +316,9 @@ def write_result(
    if sample:
        pypesto_sample_writer = SamplingResultHDF5Writer(filename)
        pypesto_sample_writer.write(result, overwrite=overwrite)

    if hasattr(result, "variational_result"):
        logger.warning(
            "Results from variational inference are not saved in the hdf5 file. "
            "You have to save them manually."
        )
9 changes: 9 additions & 0 deletions pypesto/variational/__init__.py
@@ -0,0 +1,9 @@
"""
Variational inference
=====================
Find the best variational approximation to the target distribution within a given family of distributions, from which we can then sample.
"""

from .pymc import PymcVariational
from .variational_inference import variational_fit
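The subpackage exposes two public entry points, the low-level sampler wrapper and the high-level fitting routine; a minimal import sketch:

from pypesto.variational import PymcVariational, variational_fit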
196 changes: 196 additions & 0 deletions pypesto/variational/pymc.py
@@ -0,0 +1,196 @@
"""Pymc v4 Sampler for Variational Inference."""

import logging
from typing import Optional

import numpy as np
import pytensor.tensor as pt
from scipy import stats

from ..objective import FD
from ..result import McmcPtResult
from ..sample.pymc import PymcObjectiveOp, PymcSampler
from ..sample.sampler import SamplerImportError

logger = logging.getLogger(__name__)


# implementation based on the pymc sampler code in pypesto and:
# https://www.pymc.io/projects/examples/en/latest/variational_inference/variational_api_quickstart.html


class PymcVariational(PymcSampler):
    """Wrapper around Pymc v4 variational inference.

    Parameters
    ----------
    step_function:
        A pymc step function, e.g. NUTS, Slice. If not specified, pymc
        determines one automatically (preferred).
    **kwargs:
        Options are directly passed on to `pymc.fit`.
    """

    def fit(
        self,
        n_iterations: int,
        method: str = "advi",
        random_seed: Optional[int] = None,
        start_sigma: Optional[dict[str, np.ndarray]] = None,
        inf_kwargs: Optional[dict] = None,
        beta: float = 1.0,
        **kwargs,
    ):
        """
        Fit the variational approximation to the problem.

        Parameters
        ----------
        n_iterations:
            Number of iterations.
        method: str or :class:`Inference` of pymc
            string name is case-insensitive in:
            - 'advi' for ADVI
            - 'fullrank_advi' for FullRankADVI
            - 'svgd' for Stein Variational Gradient Descent
            - 'asvgd' for Amortized Stein Variational Gradient Descent
        random_seed: int
            Random seed for reproducibility.
        start_sigma: `dict[str, np.ndarray]`
            Starting standard deviation for inference; only available for method 'advi'.
        inf_kwargs: dict
            Additional kwargs passed to `pymc.Inference`.
        beta:
            Inverse temperature (e.g. in parallel tempering).
        """
        try:
            import pymc
        except ImportError:
            raise SamplerImportError("pymc") from None

        problem = self.problem
        if not problem.objective.has_grad:
            logger.info(
                "The objective function does not provide gradients. "
                "Finite differences will be used."
            )
            problem.objective = FD(obj=problem.objective)
        log_post = PymcObjectiveOp.create_instance(problem.objective, beta)

        x0 = None
        x_names_free = problem.get_reduced_vector(problem.x_names)
        if self.x0 is not None:
            x0 = {
                x_name: val
                for x_name, val in zip(problem.x_names, self.x0)
                if x_name in x_names_free
            }

        # create model context
        with pymc.Model():
            # parameter bounds as uniform prior
            _k = [
                pymc.Uniform(x_name, lower=lb, upper=ub)
                for x_name, lb, ub in zip(
                    x_names_free,
                    problem.lb,
                    problem.ub,
                )
            ]

            # convert parameters to PyTensor tensor variable
            theta = pt.as_tensor_variable(_k)

            # define distribution with log-posterior as density
            pymc.Potential("potential", log_post(theta))

            # record function values
            pymc.Deterministic("loggyposty", log_post(theta))

            # perform the actual fitting
            data = pymc.fit(
                n=int(n_iterations),
                method=method,
                random_seed=random_seed,
                start=x0,
                start_sigma=start_sigma,
                inf_kwargs=inf_kwargs,
                **kwargs,
            )

        self.data = data

    def sample(self, n_samples: int, beta: float = 1.0) -> McmcPtResult:
        """
        Sample from the variational approximation and return a McmcPtResult object.

        Parameters
        ----------
        n_samples:
            Number of samples to be computed.
        """
        # get InferenceData object
        pymc_data = self.data.sample(n_samples)
        x_names_free = self.problem.get_reduced_vector(self.problem.x_names)
        post_samples = np.concatenate(
            [pymc_data.posterior[name].values for name in x_names_free]
        ).T
        return McmcPtResult(
            trace_x=post_samples[np.newaxis, :],
            trace_neglogpost=pymc_data.posterior.loggyposty.values,
            trace_neglogprior=np.full(
                pymc_data.posterior.loggyposty.values.shape, np.nan
            ),
            betas=np.array([1.0] * post_samples.shape[0]),
            burn_in=0,
            auto_correlation=0,
            effective_sample_size=n_samples,
            message="variational inference results",
        )

    def get_variational_parameters(self) -> tuple[list, list]:
        """Get the internal pymc variational parameters."""
        return (
            [param.name for param in self.data.params],
            [param.eval() for param in self.data.params],
        )

    def set_variational_parameters(self, param_list: list):
        """
        Set the internal pymc variational parameters.

        Parameters
        ----------
        param_list:
            List of values for the variational parameters, in the order
            returned by `get_variational_parameters`.
        """
        if len(param_list) != len(self.data.params):
            raise ValueError(
                "The number of parameters does not match the number of variational parameters."
            )
        for i, param in enumerate(param_list):
            self.data.params[i].set_value(param)

    def eval_variational_log_density(self, x: np.ndarray) -> np.ndarray:
        """
        Evaluate the log density of the variational approximation at the given points.

        Parameters
        ----------
        x:
            The points at which to evaluate the log density.
        """
        # TODO: add support for other methods
        logger.warning(
            "Currently only the methods `advi` and `fullrank_advi` are supported."
        )

        if x.ndim == 1:
            x = x.reshape(1, -1)
        # one log-density value per point
        vi_log_density = np.zeros(x.shape[0])
        for i, point in enumerate(x):
            vi_log_density[i] = stats.multivariate_normal.logpdf(
                point, mean=self.data.mean.eval(), cov=self.data.cov.eval()
            )
        return vi_log_density
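To illustrate how these methods compose, a short sketch assuming `variational` is a `PymcVariational` instance that has already been initialized on a problem and fitted via `fit` (the query point is made up):

import numpy as np

# draw samples from the fitted approximation as a pypesto McmcPtResult
mcmc_result = variational.sample(n_samples=1000)

# evaluate the Gaussian variational log density at a single query point
x = np.zeros((1, mcmc_result.trace_x.shape[-1]))
log_q = variational.eval_variational_log_density(x)

# round-trip the internal variational parameters
names, values = variational.get_variational_parameters()
variational.set_variational_parameters(values)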
136 changes: 136 additions & 0 deletions pypesto/variational/variational_inference.py
@@ -0,0 +1,136 @@
"""Functions for variational inference accessible to the user. Currently only pymc is supported."""

import logging
from time import process_time
from typing import Callable, List, Optional, Union

import numpy as np

from ..problem import Problem
from ..result import Result
from ..sample.util import bound_n_samples_from_env
from ..store import autosave
from .pymc import PymcVariational

logger = logging.getLogger(__name__)


def variational_fit(
    problem: Problem,
    n_iterations: int,
    method: str = "advi",
    n_samples: Optional[int] = None,
    random_seed: Optional[int] = None,
    start_sigma: Optional[dict[str, np.ndarray]] = None,
    x0: Union[np.ndarray, List[np.ndarray]] = None,
    result: Result = None,
    filename: Union[str, Callable, None] = None,
    overwrite: bool = False,
    **kwargs,
) -> Result:
    """
    Call to perform variational inference.

    Parameters
    ----------
    problem:
        The problem to be solved.
    n_iterations:
        Number of iterations for the optimization.
    method: str or :class:`Inference` of pymc (only interface currently supported)
        string name is case-insensitive in:
        - 'advi' for ADVI
        - 'fullrank_advi' for FullRankADVI
        - 'svgd' for Stein Variational Gradient Descent
        - 'asvgd' for Amortized Stein Variational Gradient Descent
    n_samples:
        Number of samples to generate after optimization.
    random_seed: int
        Random seed for reproducibility.
    start_sigma: `dict[str, np.ndarray]`
        Starting standard deviation for inference; only available for method 'advi'.
    x0:
        Initial parameter for the variational optimization. If None, the best
        parameter found in optimization is used.
    result:
        A result to write to. If None provided, one is created from the
        problem.
    filename:
        Name of the hdf5 file, where the result will be saved. Default is
        None, which deactivates automatic saving. If set to
        "Auto" it will automatically generate a file named
        `year_month_day_sampling_result.hdf5`.
        Optionally a method, see docs for `pypesto.store.auto.autosave`.
    overwrite:
        Whether to overwrite `result/sampling` in the autosave file
        if it already exists.

    Returns
    -------
    result:
        A result with filled-in sample_result part.
    """
    # prepare result object
    if result is None:
        result = Result(problem)

    # bound number of iterations, e.g. from environment variables
    if n_iterations is not None:
        n_iterations = bound_n_samples_from_env(n_iterations)

    # try to find initial parameters
    if x0 is None:
        result.optimize_result.sort()
        if len(result.optimize_result.list) > 0:
            x0 = problem.get_reduced_vector(
                result.optimize_result.list[0]["x"]
            )

    # set up variational inference
    # currently we only support pymc
    variational = PymcVariational()

    # initialize sampler to problem
    variational.initialize(problem=problem, x0=x0)

    # perform the variational fit and track time
    t_start = process_time()
    variational.fit(
        n_iterations=n_iterations,
        method=method,
        random_seed=random_seed,
        start_sigma=start_sigma,
        **kwargs,
    )
    t_elapsed = process_time() - t_start
    logger.info("Elapsed time: " + str(t_elapsed))

    # extract results and save samples to pypesto result
    if n_samples is None or n_samples == 0:
        # construct a McmcPtResult object with a nearly empty trace_x
        n_samples = 1

    result.sample_result = variational.sample(n_samples)
    result.sample_result.time = t_elapsed

    autosave(
        filename=filename,
        result=result,
        store_type="sample",
        overwrite=overwrite,
    )

    # make pymc object available in result
    # TODO: if needed, we can add a result object for variational inference methods
    result.variational_result = variational
    (
        result.sample_result.variational_parameters_names,
        result.sample_result.variational_parameters,
    ) = variational.get_variational_parameters()
    if filename is not None:
        logger.warning(
            "Variational parameters are not saved in the hdf5 file. "
            "You have to save them manually."
        )

    return result
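For context, an end-to-end sketch of calling `variational_fit` on a toy problem; the quadratic objective and bounds are made up, and any `pypesto.Problem` should work the same way:

import numpy as np

import pypesto
from pypesto.variational import variational_fit

# toy negative log-posterior: a 2-d quadratic bowl (gradients via the FD fallback)
objective = pypesto.Objective(fun=lambda x: float(np.sum(x**2)))
problem = pypesto.Problem(objective=objective, lb=[-5, -5], ub=[5, 5])

# fit an ADVI approximation and draw 1000 samples from it
result = variational_fit(
    problem=problem,
    n_iterations=10_000,
    method="advi",
    n_samples=1000,
)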
1 change: 1 addition & 0 deletions test/variational/__init__.py
@@ -0,0 +1 @@
"""Variational inference tests."""