Supporting Population Samplers (implemented DE-MCMC) #2735


Merged (60 commits, Dec 5, 2017)
Changes from 50 commits

Commits (60)
b95af1f
catching other error types that may occur when gradients are not avai…
michaelosthege Oct 18, 2017
168c3f5
Merge branch 'master' of https://github.com/pymc-devs/pymc3
michaelosthege Nov 9, 2017
671b387
Merge branch 'master' of https://github.com/pymc-devs/pymc3
michaelosthege Nov 14, 2017
48ef144
Merge branch 'master' of https://github.com/pymc-devs/pymc3
michaelosthege Nov 16, 2017
c0ce6ec
Merge branch 'master' of https://github.com/pymc-devs/pymc3
michaelosthege Nov 21, 2017
fd16ba5
added a benchmark example for correlated dimensions
michaelosthege Nov 21, 2017
8ec0b80
marking Metropolis as COMPATIBLE for all types, added line breaks (co…
michaelosthege Nov 21, 2017
1d04f53
specifying single job to force the sample_many function
michaelosthege Nov 21, 2017
2bd6a5a
modified sampling procedure to iterate chains in parallel (instead o…
michaelosthege Nov 21, 2017
df37cbb
updated description
michaelosthege Nov 21, 2017
ba7d083
indexing samplers by chain number instead of chain id
michaelosthege Nov 22, 2017
a4894bf
print transposes result table
michaelosthege Nov 22, 2017
cd14d6a
created PopulationArrayStepShared base class that allows the individu…
michaelosthege Nov 23, 2017
dbc42bc
modified sampling loop to account for the PopulationArrayStepShared s…
michaelosthege Nov 23, 2017
0ca3804
added the DEMetropolis sampler
michaelosthege Nov 23, 2017
2206b45
raising an error when the population is too small
michaelosthege Nov 23, 2017
6e63f49
verbose debug logging
michaelosthege Nov 23, 2017
9395de3
removed debug print
michaelosthege Nov 23, 2017
6105dec
forcing CompoundStep type
michaelosthege Nov 23, 2017
0494bc0
formatting
michaelosthege Nov 23, 2017
e25ce19
setting DEMetropolis as a blocked step method
michaelosthege Nov 23, 2017
2841442
measuring the runtime, example with both 2D z-variable and two 1D x,y…
michaelosthege Nov 23, 2017
fd6a1ef
changed the initialization order such that variable transforms are ap…
michaelosthege Nov 24, 2017
cf4ee2f
fixed a bug caused by start=None
michaelosthege Nov 24, 2017
6733ae1
fixes a bug in computing lambda
michaelosthege Nov 27, 2017
368f4aa
using a Uniform proposal with low initial scale
michaelosthege Nov 27, 2017
abcb12f
renamed local variable
michaelosthege Nov 27, 2017
acf1311
logging the crossover and scaling
michaelosthege Nov 28, 2017
3b6a2d9
fixed a bug that caused step methods to not be copied
michaelosthege Nov 28, 2017
27e8263
smarter multiprocessing
michaelosthege Nov 28, 2017
d83c5f4
automatic multiprocessing decision, reporting relative sampling rates
michaelosthege Nov 28, 2017
fc4e1d0
print format
michaelosthege Nov 28, 2017
569731b
inheriting PopulationArraySharedStep from ArrayStepShared, using a bi…
michaelosthege Nov 28, 2017
8de3977
printing the number of effective samples per variable
michaelosthege Nov 28, 2017
67e07a4
docstrings and comments
michaelosthege Nov 28, 2017
5769b9d
falling back to sequential sampling if no population samplers are used
michaelosthege Nov 28, 2017
5f6c29c
removed debugging stats logging
michaelosthege Nov 28, 2017
b53b510
fixed nested if else
michaelosthege Nov 28, 2017
4af2aa5
updated print statement
michaelosthege Nov 28, 2017
e5f7ff2
fixed a bug related to bijection updating
michaelosthege Nov 29, 2017
874e6b2
docstring and comments
michaelosthege Nov 29, 2017
eba4a9d
refactoring for better clarity and less diff
michaelosthege Nov 29, 2017
f71a37c
code style
michaelosthege Nov 29, 2017
63ae017
removed unused import
michaelosthege Nov 29, 2017
e20295a
fixed a bug where Slice was preferred on multidimensional variables
michaelosthege Nov 29, 2017
acc7538
printing the stepper hierarchy, fixed a variable name, handling non-C…
michaelosthege Nov 29, 2017
c3c233c
fixed a bug where DEMetropolis assigned itself to discrete vars, fixe…
michaelosthege Nov 29, 2017
01adad8
improved code style, including Slice in comparison
michaelosthege Nov 29, 2017
44b1115
including DEMetropolis in existing tests, added test case for Populat…
michaelosthege Nov 30, 2017
9a07a43
fixes python 2.7 compatibility
michaelosthege Nov 30, 2017
e2cfbbb
Using multiprocessing to parallelize iteration of chain populations (…
michaelosthege Nov 30, 2017
30f437d
added references
michaelosthege Dec 1, 2017
4998005
added a warning that DEMetropolis is experimental
michaelosthege Dec 1, 2017
107a618
forgotten space
michaelosthege Dec 1, 2017
b94906a
modified the PopulationStepper to automatically use parallelization o…
michaelosthege Dec 1, 2017
58fa336
avoiding a reimport, disabled chain parallelization by default
michaelosthege Dec 1, 2017
3bcf0fd
increased nchains
michaelosthege Dec 1, 2017
c919742
resolving conflicts
michaelosthege Dec 4, 2017
24b4d63
resolving conflicts
michaelosthege Dec 4, 2017
7db836a
included DEMetropolis in new features
michaelosthege Dec 5, 2017
100 changes: 100 additions & 0 deletions pymc3/examples/samplers_mvnormal.py
@@ -0,0 +1,100 @@
"""
Comparing different samplers on a correlated bivariate normal distribution.

This example will sample a bivariate normal with Metropolis, NUTS and DEMetropolis
at two correlations (0, 0.9) and print out the effective sample sizes, runtime and
normalized effective sampling rates.
"""


import numpy as np
import time
import pandas as pd
import pymc3 as pm
import theano.tensor as tt

# With this flag one can switch between defining the bivariate normal as
# either a 2D MvNormal (USE_XY = False) or as two separate 1D variables
# 'x' and 'y' (USE_XY = True). The latter is recommended because it
# highlights different behaviour with respect to blocking.
USE_XY = True

def run(steppers, p):
    steppers = set(steppers)
    traces = {}
    effn = {}
    runtimes = {}

    with pm.Model() as model:
        if USE_XY:
            x = pm.Flat('x')
            y = pm.Flat('y')
            mu = np.array([0.,0.])
            cov = np.array([[1.,p],[p,1.]])
            z = pm.MvNormal.dist(mu=mu, cov=cov, shape=(2,)).logp(tt.stack([x,y]))
            pot = pm.Potential('logp_xy', z)
            start = {'x': 0, 'y': 0}
        else:
            mu = np.array([0.,0.])
            cov = np.array([[1.,p],[p,1.]])
            z = pm.MvNormal('z', mu=mu, cov=cov, shape=(2,))
            start = {'z': [0, 0]}

        for step_cls in steppers:
            name = step_cls.__name__
            t_start = time.time()
            mt = pm.sample(
                draws=10000,
                chains=6,
                step=step_cls(),
                start=start
            )
            runtimes[name] = time.time() - t_start
            print('{} samples across {} chains'.format(len(mt) * mt.nchains, mt.nchains))
            traces[name] = mt
            en = pm.diagnostics.effective_n(mt)
            print('effective: {}\r\n'.format(en))
            if USE_XY:
                effn[name] = np.mean(en['x']) / len(mt) / mt.nchains
            else:
                effn[name] = np.mean(en['z']) / len(mt) / mt.nchains
    return traces, effn, runtimes


if __name__ == '__main__':
    methods = [
        pm.Metropolis,
        pm.Slice,
        pm.NUTS,
        pm.DEMetropolis
    ]
    names = [c.__name__ for c in methods]

    df_base = pd.DataFrame(columns=['p'] + names)
    df_base['p'] = [.0,.9]
    df_base = df_base.set_index('p')

    df_effectiven = df_base.copy()
    df_runtime = df_base.copy()
    df_performance = df_base.copy()

    for p in df_effectiven.index:
        trace, rate, runtime = run(methods, p)
        for name in names:
            df_effectiven.set_value(p, name, rate[name])
            df_runtime.set_value(p, name, runtime[name])
            df_performance.set_value(p, name, rate[name] / runtime[name])

    print('\r\nEffective sample size [0...1]')
    print(df_effectiven.T.to_string(float_format='{:.3f}'.format))

    print('\r\nRuntime [s]')
    print(df_runtime.T.to_string(float_format='{:.1f}'.format))

    if 'NUTS' in names:
        print('\r\nNormalized effective sampling rate [0...1]')
        df_performance = df_performance.T / df_performance.loc[0]['NUTS']
    else:
        print('\r\nNormalized effective sampling rate [1/s]')
        df_performance = df_performance.T
    print(df_performance.to_string(float_format='{:.3f}'.format))
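For readers who want to try the new stepper outside of this benchmark script, a minimal usage sketch (assuming the pm.DEMetropolis stepper and the chains argument used above, with otherwise default sample() settings) could look like this:

import numpy as np
import pymc3 as pm

# Sketch: sample a strongly correlated 2D normal with the new DEMetropolis stepper.
# DE-MCMC proposes jumps from the difference of two other chains, so it needs a
# population of several chains; here 10 chains are used for a 2D problem.
mu = np.zeros(2)
cov = np.array([[1.0, 0.9], [0.9, 1.0]])

with pm.Model():
    pm.MvNormal('z', mu=mu, cov=cov, shape=(2,))
    trace = pm.sample(draws=5000, chains=10, step=pm.DEMetropolis())

print(pm.diagnostics.effective_n(trace))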
150 changes: 145 additions & 5 deletions pymc3/sampling.py
@@ -1,4 +1,5 @@
from collections import defaultdict, Iterable
from copy import copy
import pickle

from joblib import Parallel, delayed
@@ -10,6 +11,7 @@
from .backends.base import BaseTrace, MultiTrace
from .backends.ndarray import NDArray
from .model import modelcontext, Point
from .step_methods import arraystep
from .step_methods import (NUTS, HamiltonianMC, SGFS, Metropolis, BinaryMetropolis,
                           BinaryGibbsMetropolis, CategoricalGibbsMetropolis,
                           Slice, CompoundStep)
@@ -143,6 +145,19 @@ def assign_step_methods(model, step=None, methods=STEP_METHODS,
    return instantiate_steppers(model, steps, selected_steps, step_kwargs)


def print_step_hierarchy(s, level=0):
    if isinstance(s, (list, tuple)):
        pm._log.info('>' * level + 'list')
        for i in s:
            print_step_hierarchy(i, level+1)
    elif isinstance(s, CompoundStep):
        pm._log.info('>' * level + 'CompoundStep')
        for i in s.methods:
            print_step_hierarchy(i, level+1)
    else:
        pm._log.info('>' * level + '{}: {}'.format(s.__class__.__name__, s.vars))


def _cpu_count():
"""Try to guess the number of CPUs in the system.

@@ -357,8 +372,10 @@ def sample(draws=500, step=None, init='auto', n_init=200000, start=None,
    else:
        step = assign_step_methods(model, step, step_kwargs=step_kwargs)

    if isinstance(step, list):
        step = CompoundStep(step)
    if start is None:
        start = [None] * chains
        start = {}
    if isinstance(start, dict):
        start = [start] * chains

@@ -380,23 +397,36 @@

    sample_args.update(kwargs)

    parallel = njobs > 1 and chains > 1
    has_population_samplers = np.any([
        isinstance(m, arraystep.PopulationArrayStepShared)
        for m in (step.methods if isinstance(step, CompoundStep) else [step])
    ])
    parallel = njobs > 1 and chains > 1 and not has_population_samplers
    if parallel:
        pm._log.info('Multiprocess sampling ({} chains in {} jobs)'.format(chains, njobs))
        print_step_hierarchy(step)
        try:
            trace = _mp_sample(**sample_args)
        except pickle.PickleError:
            pm._log.warn("Could not pickle model, sampling sequentially.")
            pm._log.warn("Could not pickle model, sampling singlethreaded.")
            pm._log.debug('Pickling error:', exec_info=True)
            parallel = False
        except AttributeError as e:
            if str(e).startswith("AttributeError: Can't pickle"):
                pm._log.warn("Could not pickle model, sampling sequentially.")
                pm._log.warn("Could not pickle model, sampling singlethreaded.")
                pm._log.debug('Pickling error:', exec_info=True)
                parallel = False
            else:
                raise
    if not parallel:
        trace = _sample_many(**sample_args)
        if has_population_samplers:
            pm._log.info('Population sampling ({} chains in 1 job)'.format(chains))
            print_step_hierarchy(step)
            trace = _sample_population(**sample_args)
        else:
            pm._log.info('Sequential sampling ({} chains in 1 job)'.format(chains))
            print_step_hierarchy(step)
            trace = _sample_many(**sample_args)

    discard = tune if discard_tuned_samples else 0
    return trace[discard:]
@@ -448,6 +478,23 @@ def _sample_many(draws, chain, chains, start, random_seed, **kwargs):
    return MultiTrace(traces)


def _sample_population(draws, chain, chains, start, random_seed, step, tune,
                       model, progressbar=None, **kwargs):
    # create the generator that iterates all chains in parallel
    chains = [chain + c for c in range(chains)]
    sampling = _iter_chains(draws, chains, step, start, tune=tune,
                            model=model, random_seed=random_seed)

    if progressbar:
        sampling = tqdm(sampling, total=draws)

    latest_traces = None
    for it,traces in enumerate(sampling):
        latest_traces = traces
        # TODO: add support for liveplot during population-sampling
    return MultiTrace(latest_traces)


def _sample(chain, progressbar, random_seed, start, draws=None, step=None,
            trace=None, tune=None, model=None, live_plot=False,
            live_plot_kwargs=None, **kwargs):
@@ -580,6 +627,99 @@ def _iter_sample(draws, step, start=None, trace=None, chain=0, tune=None,
            step.report._finalize(strace)


def _iter_chains(draws, chains, step, start, tune=None,
                 model=None, random_seed=None):
    # chains contains the chain numbers, but for indexing we need indices...
    nchains = len(chains)
    model = modelcontext(model)
    draws = int(draws)
    if random_seed is not None:
        np.random.seed(random_seed)
    if draws < 1:
        raise ValueError('Argument `draws` should be above 0.')

    # The initialization of traces, samplers and points must happen in the right order:
    # 1. traces are initialized and update_start_vals configures variable transforms
    # 2. population of points is created
    # 3. steppers are initialized and linked to the points object
    # 4. traces are configured to track the sampler stats


    # 1. prepare a BaseTrace for each chain
    traces = [_choose_backend(None, chain, model=model) for chain in chains]
    for c,strace in enumerate(traces):
        # initialize the trace size and variable transforms
        if len(strace) > 0:
            update_start_vals(start[c], strace.point(-1), model)
        else:
            update_start_vals(start[c], model.test_point, model)

    # 2. create a population (points) that tracks each chain
    # it is updated as the chains are advanced
    points = [Point(start[c], model=model) for c in range(nchains)]
    updates = [None] * nchains

    # 3. Set up the steppers
    steppers = [None] * nchains
    for c in range(nchains):
        # need independent samplers for each chain
        # it is important to copy the actual steppers (but not the delta_logp)
        if isinstance(step, CompoundStep):
            chainstep = CompoundStep([copy(m) for m in step.methods])
        else:
            chainstep = copy(step)
        # link population samplers to the shared population state
        for sm in (chainstep.methods if isinstance(step, CompoundStep) else [chainstep]):
            if isinstance(sm, arraystep.PopulationArrayStepShared):
                sm.link_population(points, c)
        steppers[c] = chainstep

    # 4. configure tracking of sampler stats
    for c in range(nchains):
        if steppers[c].generates_stats and traces[c].supports_sampler_stats:
            traces[c].setup(draws, c, steppers[c].stats_dtypes)
        else:
            traces[c].setup(draws, c)

    try:
        # iterate draws of all chains
        for i in range(draws):
            # step each of the chains
            for c in range(nchains):
                if i == tune:
                    steppers[c] = stop_tuning(steppers[c])
                updates[c] = steppers[c].step(points[c])

            # apply the update to the points and record to the traces
            for c,strace in enumerate(traces):
                if steppers[c].generates_stats:
                    points[c], states = updates[c]
                    if strace.supports_sampler_stats:
                        strace.record(points[c], states)
                    else:
                        strace.record(points[c])
                else:
                    points[c] = updates[c]
                    strace.record(points[c])
            # yield the state of all chains in parallel
            yield traces
    except KeyboardInterrupt:
        for c,strace in enumerate(traces):
            strace.close()
        if hasattr(step, 'report'):
            step.report._finalize(strace)
        raise
    except BaseException:
        for c,strace in enumerate(traces):
            strace.close()
        raise
    else:
        for c,strace in enumerate(traces):
            strace.close()
        if hasattr(step, 'report'):
            step.report._finalize(strace)


def _choose_backend(trace, chain, shortcuts=None, **kwds):
    if isinstance(trace, BaseTrace):
        return trace
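The essential pattern in _iter_chains above is that all chains advance in lock-step, one draw at a time, and the shared points are only written back after every chain has stepped, so a population sampler always proposes from the other chains' current states rather than stale ones. A stripped-down, self-contained sketch of that loop (toy stepper and plain lists standing in for the real steppers and traces; none of these names are part of the PyMC3 API):

import numpy as np

def iter_population(draws, steppers, points):
    """Toy version of the population loop in _iter_chains."""
    traces = [[] for _ in steppers]
    for _ in range(draws):
        # step every chain once before writing back, mirroring how
        # _iter_chains collects `updates` first and applies them afterwards
        updates = [stepper(points, c) for c, stepper in enumerate(steppers)]
        for c, new_point in enumerate(updates):
            points[c] = new_point
            traces[c].append(new_point)
    return traces

def toy_de_step(points, c, gamma=0.5, epsilon=1e-3):
    # difference-of-two-other-chains proposal, accepted unconditionally here;
    # a real DE-MC step would add a Metropolis accept/reject on the posterior
    others = [i for i in range(len(points)) if i != c]
    r1, r2 = np.random.choice(others, 2, replace=False)
    return points[c] + gamma * (points[r1] - points[r2]) + epsilon * np.random.randn()

population = [np.random.randn() for _ in range(10)]
chain_histories = iter_population(200, [toy_de_step] * 10, population)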
1 change: 1 addition & 0 deletions pymc3/step_methods/__init__.py
@@ -3,6 +3,7 @@
from .hmc import HamiltonianMC, NUTS

from .metropolis import Metropolis
from .metropolis import DEMetropolis
from .metropolis import BinaryMetropolis
from .metropolis import BinaryGibbsMetropolis
from .metropolis import CategoricalGibbsMetropolis
49 changes: 44 additions & 5 deletions pymc3/step_methods/arraystep.py
@@ -150,19 +150,58 @@ def __init__(self, vars, shared, blocked=True):
        self.ordering = ArrayOrdering(vars)
        self.shared = {str(var): shared for var, shared in shared.items()}
        self.blocked = blocked
        self.bij = None

    def step(self, point):
        for var, share in self.shared.items():
            share.set_value(point[var])

        bij = DictToArrayBijection(self.ordering, point)
        self.bij = DictToArrayBijection(self.ordering, point)

        if self.generates_stats:
            apoint, stats = self.astep(bij.map(point))
            return bij.rmap(apoint), stats
            apoint, stats = self.astep(self.bij.map(point))
            return self.bij.rmap(apoint), stats
        else:
            apoint = self.astep(bij.map(point))
            return bij.rmap(apoint)
            apoint = self.astep(self.bij.map(point))
            return self.bij.rmap(apoint)


class PopulationArrayStepShared(ArrayStepShared):
    """Version of ArrayStepShared that allows samplers to access the states
    of other chains in the population.

    Works by linking a list of Points that is updated as the chains are iterated.
    """

    def __init__(self, vars, shared, blocked=True):
        """
        Parameters
        ----------
        vars : list of sampling variables
        shared : dict of theano variable -> shared variable
        blocked : Boolean (default True)
        """
        self.population = None
        self.this_chain = None
        self.other_chains = None
        return super(PopulationArrayStepShared, self).__init__(vars, shared, blocked)

    def link_population(self, population, chain_index):
        """Links the sampler to the population.

        Parameters
        ----------
        population : list of Points. (The elements of this list must be
            replaced with current chain states in every iteration.)
        chain_index : int of the index of this sampler in the population
        """
        self.population = population
        self.this_chain = chain_index
        self.other_chains = [c for c in range(len(population)) if c != chain_index]
        if not len(self.other_chains) > 1:
            raise ValueError('Population is just {} + {}. This is too small. You should ' \
                             'increase the number of chains.'.format(self.this_chain, self.other_chains))
        return


class GradientSharedStep(BlockedStep):
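To show how a concrete sampler can build on PopulationArrayStepShared, here is an illustrative sketch of a differential-evolution style astep. This is not the DEMetropolis implementation added by this PR (that lives in pymc3/step_methods/metropolis.py and is outside this diff excerpt); it only demonstrates how the population, this_chain and other_chains attributes set by link_population, together with the self.bij bijection stored by the modified step() above, would typically be used:

import numpy as np
from pymc3.step_methods.arraystep import PopulationArrayStepShared

class ToyDEStep(PopulationArrayStepShared):
    """Illustrative only: jumps along the difference of two other chains.
    The usual vars/shared/delta_logp setup is omitted for brevity."""

    lamb = 0.9      # DE scaling factor; 2.38 / sqrt(2 d) is the classic DE-MC default
    epsilon = 1e-4  # small jitter so the proposal distribution is not degenerate

    def astep(self, q0):
        # pick two distinct other chains and read their *current* points
        # through the shared population list maintained during sampling
        r1, r2 = np.random.choice(self.other_chains, 2, replace=False)
        q1 = self.bij.map(self.population[r1])
        q2 = self.bij.map(self.population[r2])
        q = q0 + self.lamb * (q1 - q2) + self.epsilon * np.random.randn(len(q0))
        # a real sampler would evaluate the log-posterior difference and apply a
        # Metropolis accept/reject here; this sketch returns the raw proposal
        return q

The actual DEMetropolis additionally takes care of tuning, sampler statistics and the Metropolis accept/reject step.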