import shutil
from pathlib import Path
from typing import Optional
import numpy as np
from astromodels import use_astromodels_memoization
from astromodels.core.model import Model
from threeML.bayesian.sampler_base import UnitCubeSampler
from threeML.config.config import threeML_config
from threeML.data_list import DataList
from threeML.io.logging import setup_logger
# Optional dependency: pymultinest provides the Python bindings to MultiNest.
# Record availability so the sampler can fail with a clear message later.
try:
    import pymultinest
except ImportError:
    has_pymultinest = False
else:
    has_pymultinest = True

# Detect whether we are running under MPI with more than one process.
# mpi4py's import can fail for reasons other than a missing package
# (e.g. a broken MPI runtime), so we catch Exception — but not a bare
# except, which would also swallow KeyboardInterrupt/SystemExit — and
# fall back to serial mode.
try:
    # see if we have mpi and/or are using parallel
    from mpi4py import MPI

    if MPI.COMM_WORLD.Get_size() > 1:  # need parallel capabilities
        using_mpi = True

        comm = MPI.COMM_WORLD
        rank = comm.Get_rank()
    else:
        using_mpi = False
except Exception:
    using_mpi = False
log = setup_logger(__name__)
class MultiNestSampler(UnitCubeSampler):
    """
    Bayesian sampler wrapping MultiNest
    (https://github.com/farhanferoz/MultiNest) via the PyMultiNest
    python bindings (https://github.com/JohannesBuchner/PyMultiNest).
    """

    def __init__(
        self,
        likelihood_model: Optional[Model] = None,
        data_list: Optional[DataList] = None,
        **kwargs,
    ):
        """
        Implements the MultiNest sampler of https://github.com/farhanferoz/MultiNest
        via the python wrapper of https://github.com/JohannesBuchner/PyMultiNest

        :param likelihood_model: the likelihood model to sample
        :param data_list: the data to fit against
        :raises RuntimeError: if pymultinest is not installed
        """

        # Raise a real exception instead of asserting: an assert is
        # stripped when Python runs with -O.
        if not has_pymultinest:
            log.error("You must install MultiNest to use this sampler")

            raise RuntimeError("You must install MultiNest to use this sampler")

        super(MultiNestSampler, self).__init__(likelihood_model, data_list, **kwargs)

    def setup(
        self,
        n_live_points: int = 400,
        chain_name: str = "chains/fit-",
        resume: bool = False,
        importance_nested_sampling: bool = False,
        auto_clean: bool = False,
        **kwargs,
    ):
        """
        Setup the MultiNest Sampler. For details see:
        https://github.com/farhanferoz/MultiNest

        :param n_live_points: number of live points for the evaluation
        :param chain_name: path prefix for the MultiNest output files
        :param resume: resume from previous fit
        :param importance_nested_sampling: use INS
        :param auto_clean: automatically remove multinest chains after run
        :returns:
        :rtype:
        """

        log.debug(
            f"Setup for MultiNest sampler: n_live_points:{n_live_points}, chain_name:{chain_name},"
            f"resume: {resume}, importance_nested_sampling: {importance_nested_sampling}."
            f"Other input: {kwargs}"
        )

        # "chain_name" is kept alongside "outputfiles_basename" on purpose:
        # sample() pops it to locate/create the output directory, while
        # pymultinest.run itself only reads "outputfiles_basename".
        self._kwargs = {
            "n_live_points": n_live_points,
            "outputfiles_basename": chain_name,
            "importance_nested_sampling": importance_nested_sampling,
            "chain_name": chain_name,
            "resume": resume,
            **kwargs,
        }

        self._auto_clean = auto_clean

        self._is_setup = True

    def sample(self, quiet: bool = False):
        """
        sample using the MultiNest numerical integration method

        :param quiet: if True, do not display the results at the end
        :returns: the posterior samples (None if setup() was never called)
        :raises RuntimeError: if pymultinest is missing or parallel mode is on
        """
        if not self._is_setup:
            log.info("You forgot to setup the sampler!")
            return

        # Explicit check instead of an assert (stripped under -O).
        if not has_pymultinest:
            raise RuntimeError(
                "You don't have pymultinest installed, so you cannot run the Multinest sampler"
            )

        loud = not quiet

        self._update_free_parameters()

        n_dim = len(self._free_parameters)

        # MULTINEST uses a different call signature for sampling,
        # so we construct the callbacks it expects.
        loglike, multinest_prior = self._construct_unitcube_posterior()

        # We need to check if the MCMC chains will have a place on
        # the disk to write and if not, create one.
        chain_name = Path(self._kwargs.pop("chain_name"))
        chain_dir = chain_name.parent

        if using_mpi:
            # only the first engine creates the chains directory; the
            # barriers keep the other engines from starting MultiNest
            # before the directory exists
            comm.Barrier()

            if rank == 0:
                if not chain_dir.exists():
                    log.debug(f"Create {chain_dir} for multinest output")

                    # parents/exist_ok: tolerate nested paths and the
                    # exists()/mkdir() race
                    chain_dir.mkdir(parents=True, exist_ok=True)

            # NOTE(review): barrier added after creation so non-root ranks
            # cannot reach pymultinest.run before the directory is visible
            comm.Barrier()

        else:
            if not chain_dir.exists():
                log.debug(f"Create {chain_dir} for multinest output")

                chain_dir.mkdir(parents=True, exist_ok=True)

        # Multinest must be run parallel via an external method
        # see the demo in the examples folder!!
        if threeML_config["parallel"]["use_parallel"]:
            log.error(
                "If you want to run multinest in parallell you need to use an ad-hoc method"
            )

            raise RuntimeError()

        else:
            # Disable astromodels memoization: MultiNest evaluates the
            # likelihood at unique points, so caching only adds overhead.
            with use_astromodels_memoization(False):
                log.debug("Start multinest run")

                sampler = pymultinest.run(
                    loglike, multinest_prior, n_dim, n_dim, **self._kwargs
                )

                log.debug("Multinest run done")

        # Use PyMULTINEST analyzer to gather parameter info; under MPI
        # only the first engine reads the result files back.
        process_fit = False

        if using_mpi:
            # wait for MultiNest to finish everywhere before reading
            comm.Barrier()

            process_fit = rank == 0

        else:
            process_fit = True

        if process_fit:
            # pymultinest builds file names by string concatenation, so the
            # basename must be a str, not a Path
            multinest_analyzer = pymultinest.analyse.Analyzer(
                n_params=n_dim, outputfiles_basename=str(chain_name)
            )

            # Read the equal-weighted posterior file once: the last column
            # is the log-likelihood, the rest are the parameter samples.
            equal_weighted = multinest_analyzer.get_equal_weighted_posterior()

            self._log_like_values = equal_weighted[:, -1]

            self._sampler = sampler

            self._raw_samples = equal_weighted[:, :-1]

            # now get the log probability (posterior = likelihood * prior)
            self._log_probability_values = self._log_like_values + np.array(
                [self._log_prior(samples) for samples in self._raw_samples]
            )

            self._build_samples_dictionary()

            # MultiNest reports ln(Z); convert the evidence to log10
            self._marginal_likelihood = multinest_analyzer.get_stats()[
                "global evidence"
            ] / np.log(10.0)

            self._build_results()

            # Display results
            if loud:
                self._results.display()

            # now clean up the chains if requested
            if self._auto_clean:
                log.info(f"deleting the chain directory {chain_dir}")

                shutil.rmtree(chain_dir)

        return self.samples