Source code for beansp.beans

"""Main module. This has functions that do the sampling, save the chains, and analyse the results."""

## Python packages required:
import matplotlib.pyplot as plt
from matplotlib.colors import LogNorm
import numpy as np
import pandas as pd
import emcee
from astropy.io import ascii
import astropy.units as u
import astropy.constants as const
from astropy.table import Table, Column, MaskedColumn
from astropy.time import Time, TimeDelta
from matplotlib.ticker import MaxNLocator
from scipy.stats import gaussian_kde
# import scipy.stats as stats
from scipy.interpolate import splrep, BSpline, splint
from chainconsumer import ChainConsumer
from multiprocessing import cpu_count
import os
import time
from configparser import ConfigParser
import pickle

import pkg_resources  # part of setuptools
try:
    # this will fail if the package is not pip-installed
    __version__ = pkg_resources.require("beansp")[0].version
except:
    # in which case just record the path
    __version__ = os.getcwd()

# Set the default font to Times; this doesn't seem to affect the
# ChainConsumer plots

plt.rcParams['font.family'] = 'serif'
plt.rcParams['font.serif'] = ['Times']
plt.rcParams['text.usetex'] = True

# Some constants & standard units

BSTART_ERR = 10*u.min # Default uncertainty for burst start times
M_NS = 1.4 # canonical NS mass [M_sun]
R_NS = 11.2 # canonical NS mass [km]
FLUX_U = 1e-9*u.erg/u.cm**2/u.s
FLUEN_U = 1e-6*u.erg/u.cm**2

# -------------------------------------------------------------------------#
## load local  modules
from .settle import settle
from .burstrain import generate_burst_train, next_burst, burstensemble
from .run_model import runmodel, burst_time_match
from .get_data import get_obs
from .mrprior import mr_prior
from .run_emcee import runemcee
from .analyse import get_param_uncert_obs, get_param_uncert_part, get_param_uncert

# -------------------------------------------------------------------------#


__all__ = (
    "Beans"
)

# Some example prior functions, or you can write your own for input to the code.

# Define priors for theta. mr prior function is located in mrprior.py


[docs]def lnZprior(z):
    """
    This beta function for the metallicity prior is from Andy Casey and is an
    approximation of the metallicity of a mock galaxy at 2.5-4.5 kpc for the
    location of SAX J1808.4-3658. Assuming ZCNO = 0.01 is average value.

    :param z: CNO metallicity (mass fraction)

    :return: prior probability
    """

    from scipy import stats

    beta = stats.beta
    ZCNO = 0.01

    return np.log(
        beta(10, 3).pdf((np.log10(z / ZCNO) + 3) / 3.75) / (3.75 * np.log(10) * z)
    )


[docs]def prior_func(theta_in):
    """
    This function is the default prior and implements a simple box prior
    for all the parameters

    :param theta_in: parameter vector, with *X*, *Z*, *Q_b*, *d*, *xi_b*,
      *xi_p*, and (optionally) *mass*, *radius*, *f_E* & *f_a*

    :return: prior probability
    """

    X, Z, Q_b, dist, xi_b, xi_p, *extra = theta_in
    mass, radius, f_E, f_a = extra+[M_NS, R_NS, 1.0, 1.0][len(extra):]

    # upper bound and lower bounds of each parameter defined here. Bounds were
    # found by considering an estimated value for each parameter then giving
    # reasonable limits.
    if (0.00001 < X < 0.76) and (0.00001 < Z < 0.056) and \
        (0.000001 <= Q_b < 5.0) and (1 < dist < 20) and \
        (0.01 < xi_b < 2) and (0.01 < xi_p < 2) and \
        (1 <= f_a < 100) and (1 <= f_E < 100) and \
        (1.15 < mass < 2.5) and (9 < radius < 17):
        return 0.0
    else:
        return -np.inf


[docs]def prior_1808(theta_in):
    """
    This function implements a simple box prior for all the parameters
    excluding mass, radius, and the metallicity, which come instead from
    :function:`beansp.beans.lnZprior`

    This prior is explicitly intended for use with SAX J1808.4-3658, and
    should only be used with extreme caution in other cases!

    :param theta_in: parameter vector, with *X*, *Z*, *Q_b*, *d*, *xi_b*,
      *xi_p*, *mass*, *radius*, and (optionally) *f_E* & *f_a*

    :return: prior probability
    """

    X, Z, Q_b, dist, xi_b, xi_p, *extra = theta_in
    mass, radius, f_E, f_a = extra+[M_NS, R_NS, 1.0, 1.0][len(extra):]

    # upper bound and lower bounds of each parameter defined here. Bounds were
    # found by considering an estimated value for each parameter then giving
    # reasonable limits.
    if (0.00001 < X < 0.76) and (Z > 0.000010000001) and \
        (0.000001 <= Q_b < 5.0) and (1 < dist < 20) and \
        (0.01 < xi_b < 2) and (0.01 < xi_p < 2) and \
        (1 <= f_a < 100) and (1 <= f_E < 100):

        return 0.0 + lnZprior(Z) + mr_prior(mass, radius)
    else:
        return -np.inf


[docs]def corr_goodwin19(burst, **kwargs):
    """
    This is an example Settle correction function that applies the correction
    of Goodwin et al. (2019), multiplying the recurrence time and burst
    energy by 0.65. With this correction there is no need to modify the
    alpha value.
    The ``**kwargs`` can be used to incorporate other parameters into the
    correction; from settle we pass the base flux F, mdot M, H-fraction X,
    metallicity Z, and neutron star radius R and mass M (none used for
    this example)

    :param burst: 3-element tuple output from settle, with alpha, trec [hr], and burst energy [1e39 erg], all values in the observer frame

    :return: tuple with any necessary corrections performed
    """

    return (burst[0], burst[1]*0.65, burst[2]*0.65)


def corr_kepler(burst, **kwargs):
    """
    This is an example Settle correction function that applies the correction
    to match kepler burst results.
    The ``**kwargs`` can be used to incorporate other parameters into the
    correction; from settle we pass the base flux F, mdot M, H-fraction X,
    metallicity Z, and neutron star radius R and mass M (none used for
    this example)

    :param burst: 3-element tuple output from settle, with alpha, trec [hr], and burst energy [1e39 erg], all values in the observer frame

    :return: tuple with any necessary corrections performed
    """

    #Scale Fluence
    Fluence_coef= [-0.01494263, 0.61500959,  0.13263262]
    E_error = Fluence_coef[0]*burst[2]**2 + Fluence_coef[1]*burst[2] + Fluence_coef[2]

    #Scale trec
    a = burst[1]; b = kwargs['Z']; c = kwargs['X']
    form = [1, a, b, c, a ** 2, a * b, a * c, b ** 2, b * c, c ** 2]
    tdel_coff = [4.00396086e-24,  1.78459388e+00, 6.37416752e+01, -4.06404901e+00,
                2.94290411e-02,  4.52264987e+00, -2.35649145e+00, -4.64376836e+02,
                -2.73559070e+01,  8.08332362e+00]
    intercept = -0.8976578105076352
    t_error = np.dot(tdel_coff,form) + intercept

    # alpha ~ tdel/E_b, thus scale alpha as well
    t_fac = (burst[1] - t_error) / burst[1]
    e_fac = (burst[2] - E_error) / burst[2]
    alp_scl = burst[0] * (1 - t_fac) / (1 - e_fac)

    return (alp_scl, t_error, E_error)


def model_str(model):
    """
    Prints a compressed string representation of the model dict, with
    selected parameters and reduced precision to reduce the size of the
    record saved to the .h5 file

    :param model: model dictionary as returned by runmodel

    :return: string representation of the model dict
    """

    return ("{'time': ["+','.join(['{:.4f}'.format(x) for x in model['time']]) \
        +"], 'mdot': ["+','.join(['{:.5f}'.format(x) for x in model['mdot']]) \
        +"], 'alpha': ["+','.join(['{:.3f}'.format(x) for x in model['alpha']]) \
        +"], 'e_b': ["+','.join(['{:.4f}'.format(x) for x in model['e_b']]) \
        +"]}").replace(' ','')


def mean_flux_spline(t1, t2, bean):
    """
    Calculates the mean flux between t1 and t2 from the spline set up at
    the __init__ phase

    :param t1: start time for averaging
    :param t2: end time for averaging
    :param bean: :class:`beansp.Beans` object, from which the remaining parameters are drawn:
      tck_s

    :result: mean flux
    """

    return splint(t1,t2,bean.tck_s)/(t2-t1)


def mean_flux_linear(t1, t2, bean):
    """
    Calculates the mean flux between ``t1`` and ``t2`` from the piecewise
    linear interpolation of ``tobs``, ``a``, ``b``

    :param t1: start time for averaging
    :param t2: end time for averaging
    :param bean: :class:`beansp.Beans` object, from which the remaining parameters are drawn:
      tobs, a, b

    :result: mean flux
    """

    tobs, a, b = bean.tobs, bean.a, bean.b
    na = len(a)

    if len(tobs) != na + 1 or len(b) != na:
        print("** ERROR ** some problem with tobs, a, b arrays")
        return -1
    # i1 is max of where t1 > tobs

    i1 = max(np.where(t1 > tobs))
    if len(i1) == 0:
        i1 = -1
    else:
        i1 = max(i1)

    i2 = max(np.where(t2 > tobs))
    if len(i2) == 0:
        i2 = -1
    else:
        i2 = max(i2)

    sum = 0.0
    if (i1 < 0) and (i2 < 0):

        # Modified this section to just report the flux from the first measurement

        sum += (t2 - t1) * (a[0] + b[0] * tobs[0])
    else:

        # Add the contribution from the start time through to tobs[0], using the
        # gradient between the first pair of observations

        if i1 < 0:
            sum = sum + (tobs[0] - t1) * np.mean(
                [a[0] + b[0] * t1, a[0] + b[0] * tobs[0]]
            )

        # Add the contributions between each pair of observations

        for i in range(max([0, i1]), min([i2, na - 1]) + 1):
            sum = sum + (min([t2, tobs[i + 1]]) - max([t1, tobs[i]])) * np.mean(
                [a[i] + b[i] * max([t1, tobs[i]]), a[i] + b[i] * min([t2, tobs[i + 1]])]
            )

        # Add the contribution for the last section which overlaps with the
        # observation times

        if i1 < na and i2 == na:
            sum = sum + (t2 - tobs[i2]) * np.mean(
                [a[i2 - 1] + b[i2 - 1] * tobs[i2], t2]
            )

        # Now add any contribution *completely* beyond the observations. Previously
        # this gave an exception

        if i1 == na and i2 == na:
            sum = sum + (t2 - t1) * np.mean(
                [a[na - 1] + b[na - 1] * t1, a[na - 1] + b[na - 1] * t2]
            )

    return sum / (t2 - t1)


def get_a_b(pflux, pfluxe, tobs):
    """
    Do piecewise continuous fits to the flux evolution, to determine the
    appropriate parameters for each interval for use by mean_flux_linear:

    :param pflux: persistent flux measurements to interpolate
    :param pfluxe: uncertainty on persistent flux (not used)
    :param tobs: time (midpoint of observation extent) for flux measurement
    :result: a, b arrays for use with mean_flux
    """

    # Now actually calculate the coefficients for the flux fit

    # Linear fit
    ng = len(tobs)

    b0 = np.zeros(ng - 1)
    a0 = np.zeros(ng - 1)

    for i in range(1, ng):
        b0[i - 1] = (pflux[i] - pflux[i - 1]) / (tobs[i] - tobs[i - 1])
        a0[i - 1] = pflux[i - 1] - b0[i - 1] * tobs[i - 1]

    return a0, b0


[docs]class Beans:
    """
    The main object class that includes the basic functionality required for
    beans. The code will read in burst (and observation) data and attempt to
    simulate bursts to match the observed burst properties. There are two
    principle modes; the original function generates a "train" of individual
    bursts, observed (for example) during a transient outburst, as for the
    original application to the 2002 outburst of SAX J1808.4-3658, observed
    with RXTE/PCA. The alternative is to match to a set of non-contiguous
    bursts ("ensemble" mode)
    """

    HAS_CONCORD = False
    try:
        # Required for the distance_limit method
        import concord as cd
        HAS_CONCORD = True
    except:
        pass

[docs]    def __init__(self, prior=prior_func, corr=None, config_file=None,
                 run_id="test", nwalkers=200, nsteps=100,
                 obsname=None, burstname=None, gtiname=None,
                 interp='linear', smooth=0.02,
                 theta= (0.58, 0.013, 0.4, 3.5, 1.0, 1.0, 1.5, 11.8),
                 stretch_a=2.0, fluen=True, alpha=True, 
                 numburstssim=3, bc=2.21, ref_ind=1, threads = 4,
                 test_model=True, restart=False, **kwargs):
        """
        Initialise a Beans object

        :param prior: prior function to use
        :param corr: correction function for bursts, or None
        :param config_file: file to read in configuration parameters (in
          which case the keyword params below are ignored)
        :param run_id: string identifier for the run, used to label all the
          result files, and where you want output to be saved
        :param nwalkers: number of walkers for the emcee run
        :param nsteps: number of MCMC steps to run
        :param obsname: name of the file including the flux history, from which
          the mdot is estimated to generate to generate the burst train
          (set ``obsname=None`` for a non-contiguous, or "ensemble" mode run)
        :param burstname: name of the burst data file, listing the bursts
        :param gtiname: name of the GTI file, set to ``None`` to turn off
          checking
        :param interp: interpolation mode for the flux; possible values are
          'linear', or 'spline'
        :param smooth: smoothing factor for spline interpolation
        :param theta: initial centroid values for walker model parameters, with
          *X*, *Z*, *Q_b*, *d*, *xi_b*, *xi_p*, and (optionally) *mass*,
          *radius*, *f_E* & *f_a*
        :param stretch_a: the Goodman & Weare (2010) stretch move scale parameter, passed to emcee
        :param fluen: set to True (default) to include the fluences in the
          data for comparison, or False to omit
        :param alpha: set to True (default) to include the alphas in the
          data for comparison, or False to omit
        :param numburstssim: number of bursts to simulate, for the "train" mode,
          both earlier and later than the reference burst; i.e. set to half
          the total number of bursts you want to simulate. Don't forget to
          account for missed bursts!
        :param bc: bolometric correction to adopt for the flux history (set
          to 1.0 if the fluxes are already bolometric):
        :param ref_ind: rank of "index" burst, against which the other burst
          times are relative to. For the "train" mode, should be around the
          middle of the predicted burst train. This burst will not be
          simulated but will be used as a reference to predict the other bursts.
        :param threads: number of threads for emcee to use (e.g. number of
          cores your computer has). Set to ``None`` to use all available
        :param test_model: flag to test the model during the setup process
        :param restart: set to ``True`` to continue a previously interrupted run

        :result: Beans object including all the required data
        """

        # Some housekeeping

        if 'ndim' in kwargs.keys():
            print ('\n** WARNING ** parameter ndim is redundant (ignored), setting from len of param array')
        if 'numburstsobs' in kwargs.keys():
            print ('\n** WARNING ** parameter numburstsobs is redundant (ignored), setting from len of burst data')
        if 'gti_checking' in kwargs.keys():
            print ('\n** WARNING ** parameter gti_checking is redundant (ignored), setting from value of gtiname param')

        # Conversion factor between model predicted burst energy and
        # observed fluence. Multiply by this value to convert the burst
        # energy from settle (in 1e39, the observer frame) to fluence at 1
        # kpc in units of 1e-6 erg/cm^2

        self.fluen_fac = ((1e39*u.erg/(4*np.pi*u.kpc**2))
            / (1e-6*u.erg/u.cm**2)).decompose()

        # Conversion factor between persistent flux (in units of 1e-9
        # erg/cm^2/s) and the accretion rate

        self.r1 = (1e-9*u.erg/u.cm**2/u.s*u.kpc**2
            / (u.km*const.c)**2).decompose()

        # Conversion factor for redshift, GM/Rc^2

        self.gmrc2 = (2.*const.G*const.M_sun/(const.c**2*u.km)).decompose()

        # MCU: this is a solution to load packaged data compatible
        # with python 3.6 - 3.10
        # however for python 3.10 and later this might become deprecated
        # alternative method is "from importlib.resources import files"
        # see https://setuptools.pypa.io/en/latest/userguide/datafiles.html

        data_path = os.path.join(os.path.dirname(__file__), 'data')
        print("data_path = " + data_path)

        # Only want to set the default values if both obsname and burstname
        # are not set (indicating a default run). This because setting
        # obsname=None is also how we indicate an "ensemble" mode run
        if (obsname is None) & (burstname is None):
            obsname = os.path.join(data_path, '1808_obs.txt')

        if run_id is None:
            run_id = os.path.join(data_path, '1808/test1')

        if burstname is None:
            burstname = os.path.join(data_path, '1808_bursts.txt')

        # apply the keyword values or defaults

        self.run_id = run_id
        self.obsname = obsname
        self.burstname = burstname
        self.gtiname = gtiname
        self.ref_ind = ref_ind
        self.bc = bc

        self.theta = theta
        self.stretch_a = stretch_a
        self.numburstssim = numburstssim
        self.lnprior = prior
        self.corr = corr
        self.nwalkers = nwalkers
        self.nsteps = nsteps
        self.threads = threads

        self.cmpr_fluen = fluen
        self.cmpr_alpha = alpha

        # check for the config_file, and if detected read in (will
        # override the defaults above):

        config_file_exists = None
        if (config_file is not None):
            if (os.path.exists(config_file)):
                config_file_exists = True
                cmpr_alpha, cmpr_fluen = True, True
                print ('Reading run params from {} ...'.format(config_file))
                self.read_config(config_file)
                print ("...done")
                # special here for the alpha and fluen parameters, which
		# are replaced by the actual data values (if the option is
		# True); (pre-v2.10 config files don't list alpha or fluen)
                if hasattr(self, 'alpha'):
                    self.cmpr_alpha = self.alpha
                    alpha = self.alpha
                if hasattr(self, 'fluen'):
                    self.cmpr_fluen = self.fluen
                    fluen = self.fluen
            else:
                print ('\n** ERROR ** config file not found, applying keywords\n')
                config_file_exists = False

        # Some checks here

        if alpha and (not fluen):
            print ('** ERROR ** need to include fluences as well as alphas')
            return

        if self.lnprior(self.theta) == -np.inf:
            print ('** ERROR ** supplied parameter vector is excluded by the prior')
            return

        # below set the parameters which are not part of the config
        # file

        self.restart = restart

        # number of dimensions for the parameter array
        # we want to record whether we're including systematic errors
        # here; previously this was via the (boolean) has_systematic

        self.ndim = len(self.theta)
        if (self.ndim < 6) | (self.ndim > 10):
            print ('** ERROR ** number of dimensions of input parameter vector should be 6-10')
            return
        self.num_systematic = self.ndim-8
        if ((self.ndim == 9) & (not self.cmpr_fluen)) | \
            ((self.ndim == 10) & (not (self.cmpr_alpha and self.cmpr_fluen))):
            print ("\n** WARNING ** systematic errors are provided for ignored quantities!")

        self.gti_checking = self.gtiname is not None

        # determines whether will run as a train of bursts or non-contiguous
        # bursts ("ensemble" mode); previously numerical, default is 1 (True),
        # which means a burst train will be generated; set obsname=None for
        # non-contiguous (ensemble mode) run

        self.train = (self.obsname is not None)

        self.bstart_err = BSTART_ERR.to('d').value
        self.M_NS = M_NS
        self.R_NS = R_NS

        self.matches = None

        # Read in all the measurements and set up all the parameters
        # This function now operates on the Beans object directly, and the
        # required attributes:
        # x, y, yerr, tref, bstart, pflux, pfluxe, tobs, fluen, fluen_err,
        #     st, et
        # are set in that routine
        # bypasses the earlier init function, and instead calls get_obs
        # directly

        get_obs(self, alpha=alpha, fluen=fluen)

        # Set interpolation mode, and define averaging function

        if not hasattr(self, 'interp'):
            self.interp = interp
        assert self.interp in ('linear','spline')
        if self.interp == 'linear':
            self.a, self.b = get_a_b(self.pflux, self.pfluxe, self.tobs)
            self.mean_flux = mean_flux_linear
        else:
            if not hasattr(self, 'smooth'):
                self.smooth = smooth
            self.tck_s = splrep(self.tobs, self.pflux, s=self.smooth)
            self.mean_flux = mean_flux_spline

        # # -------------------------------------------------------------------------#
        # # TEST THE MODEL WORKS
        # # -------------------------------------------------------------------------#
        print("# ---------------------------------------------------------------------------#")
        print("Doing Initialisation..")

        if test_model:

            print("Testing the model works..")


            test, valid, test2 = runmodel(self.theta, self, debug=False) # set debug to True for testing
            print("result: ", test, valid)

            # MCU Note: commented out - no interactive windows for automated testing
            # self.plot_model(test2)


    def __str__(self):
        """
        Show the parameters that the code has been intialised with
        For restart runs could include the number of steps that has
        already been done
        """

        return """== beans dataset =============================================================
See https://beans-7.readthedocs.io

Run ID: {}
Observation data file: {}
  bolometric correction: {}
GTI data file: {}
Burst data file: {}
  comprising {} observed bursts, {}including alphas{}{}
No. of bursts to simulate: {} ({} mode)
  with {} walkers, {} steps, {} threads{}, a={}
Initial parameters:
{}
==============================================================================""".format(self.run_id, self.obsname, self.bc, self.gtiname, self.burstname,
            self.numburstsobs,
            '' if self.cmpr_alpha else 'not ',
            '' if self.cmpr_fluen else ' or fluences',
            '' if self.obsname is None else ', ref. to #{}'.format(self.ref_ind),
            self.train+self.numburstssim*(1+self.train),
            'train' if self.train else 'ensemble',
            self.nwalkers, self.nsteps,
            self.threads,
            ', resuming' if self.restart else '', self.stretch_a,
            self.theta_table(self.theta, indent=2) )


    def theta_table(self, theta, indent=0):
        """
        Format the run parameter vector as a table
        Could include the errors for a neatly formatted way to present
        results

        :param theta: the model parameter tuple, with *X*, *Z*, *Q_b*, *d*,
          *xi_b*, *xi_p*, *mass*, *radius*, and (optionally) *f_E* & *f_a*
        :param indent: number of characters to indent the string from the left
        """

        X, Z, Q_b, dist, xi_b, xi_p, *extra = theta
        mass, radius, f_E, f_a = extra+[self.M_NS, self.R_NS, 1.0, 1.0][len(extra):]

        result = """#X = {:.3f} \\ hydrogen mass fraction
#Z = {:.5f} \\ CNO mass fraction
#Q_b = {:.3f} \\ base flux [MeV/nucleon]
#d = {:.2f} kpc \\ source distance
#xi_b = {:.3f} \\ anisotropy factor for burst emission
#xi_p = {:.3f} \\ anisotropy factor for persistent emission""".format(
    X, Z, Q_b, dist, xi_b, xi_p)
        result = result+"\n#M_NS = {:.3f} M_sun \\ neutron star mass".format(mass)
        if len(theta) <= 6:
            result += ' (fixed)'
        result = result+"\n#R_NS = {:.3f} km \\ neutron star radius".format(radius)
        if len(theta) <= 7:
            result += ' (fixed)'
        if self.num_systematic == 1:
            return (result+"""
#f_E = {:.3f} \\ systematic error term for fluence""".format(
    f_E)).replace('#',' '*indent)
        elif self.num_systematic == 2:
            return (result+"""
#f_E, f_a = {:.3f}, {:.3f} \\ systematic error terms for fluence, alpha""".format(
    f_E, f_a)).replace('#',' '*indent)

        return result.replace('#', ' '*indent)


    def mdot_Edd(self, X, radius):
        """
        Calculate the Eddington accretion rate (per unit area) as used
        by Settle, for converting to physical units. The Eddington rate is
        (1.75*(1.7/(1+G.X))*(1e-8)*(5.01837638e24))/(G.R*G.R)
        (settle.cc, line 131) where G.X is the hydrogen mass fraction, and
        G.R is the radius in cm; the constant is  M_sun/(4*365.25×86400)
        (i.e. the conversion of  M_sun /yr to g/s) to better than 1 part
        in 1000) in the NS frame

        :param X: accreted H-fraction
        :param radius: NS radius (km)

        :return: accretion rate in g/cm^2/s
        """

        return (1.75e-8*1.7/(1+X)*5.01837638e24)/(radius*1e5)**2 * u.g/u.cm**2/u.s


    def save_config(self, file=None, clobber=True):
        """
        Routine to write all the configuration parameters to a file, as a
        record of the run; but also to more easily replicate or continue
        a run. List of all the parameters saved to the configuration file:
        ``run_id``, ``obsname``, ``burstname``, ``gtiname``, ``alpha``,
        ``fluen``, ``ref_ind``, ``bc``, ``interp``, ``smooth``, ``theta``,
        ``numburstssim``, ``prior``, ``nwalkers``, ``nsteps``, ``threads``

        :param file: name of file to save the config as. If None, the run_id
          will be used as a prefix
        :param clobber: set to True to overwrite any existing file
        """

        if file is None:
            file = self.run_id+'.ini'

        if (not clobber) and (os.path.isfile(file)):
            print ('** ERROR ** config file already exists, skipping write')
            return
        else:
           cfgfile = open(file, "w")

           Config = ConfigParser()
           Config.add_section("beans")
           Config.set("beans", "run_id", self.run_id)
           Config.set("beans", "version", __version__)

           Config.add_section("data")
           Config.set("data", "obsname", str(self.obsname))
           Config.set("data", "burstname", self.burstname)
           Config.set("data", "gtiname", str(self.gtiname))
           Config.set("data", "alpha", str(self.cmpr_alpha))
           Config.set("data", "fluen", str(self.cmpr_fluen))

           if self.obsname is not None:
               # These parameters only used for "train" mode
               Config.set("data", "tref", str(self.tref))
               Config.set("data", "ref_ind", str(self.ref_ind))
               Config.set("data", "bc", str(self.bc))
               Config.set("data", "interp", str(self.interp))
               if self.interp == 'spline':
                   Config.set("data", "smooth", str(self.smooth))

           Config.add_section("emcee")
           Config.set("emcee", "theta", str(self.theta))
           Config.set("emcee", "stretch_a", str(self.stretch_a))
           Config.set("emcee", "numburstssim", str(self.numburstssim))
           Config.set("emcee", "prior", str(self.lnprior))
           Config.set("emcee", "corr", str(self.corr))
           Config.set("emcee", "nwalkers", str(self.nwalkers))
           Config.set("emcee", "nsteps", str(self.nsteps))
           Config.set("emcee", "threads", str(self.threads))

           Config.write(cfgfile)
           cfgfile.close()


    def read_config(self, file=None):
        """
        Routine to read all the configuration parameters from a file, to
        more easily replicate or continue a run

        :param file: name of file to read the config from.
        """

        if file is None:
            data_path = os.path.join(os.path.dirname(__file__), 'data')
            run_id = os.path.join(data_path, 'beans.ini')

        int_params = ('ref_ind','numburstssim','nwalkers','nsteps','threads')
        float_params = ('bc', 'smooth', 'tref', 'stretch_a')

        if not os.path.isfile(file):
            print ('** ERROR ** config file not found')
            return

        config = ConfigParser(allow_no_value=True)
        config.read(file)

        # Loop over sections, attributes

        for section in config.sections():
            # print("Section: %s" % section)
            for option in config.options(section):
                # print(
                #     "x %s:::%s:::%s"
                #     % (option, config.get(section, option), str(type(option))))
                if option == 'theta':
                    setattr(self, option,
                        tuple(map(float, config.get(section, option)[1:-1].split(', '))))
                elif option in float_params:
                    setattr(self, option, config.getfloat(section, option))
                elif (option == 'prior'):
                    function_name = config.get(section, option).split(' ')[1]
                    if (option == 'prior') & (function_name != str(self.lnprior).split(' ')[1]):
                        print ('''
** WARNING ** config file lists the prior function as {},
                but supplied prior is {}
              To fully replicate the previous run you need to specify the
                same prior using the prior=beans.{} flag on init
'''.format(function_name, str(self.lnprior).split(' ')[1], function_name))
                elif (option == 'corr'):
                    function_name = config.get(section, option)
                    if function_name != 'None':
                        function_name = function_name.split(' ')[1]
                    _scorr = str(self.corr)
                    if _scorr != 'None':
                        _scorr = _scorr.split(' ')[1]
                    if (function_name != _scorr):
                        print ('''
** WARNING ** config file lists {} for the correction,
                but supplied value is {}
              To fully replicate the previous run you need to specify the
                same option/condition using the corr=beans.{} flag on init
'''.format(function_name, _scorr, function_name))
                elif option in int_params:
                    setattr(self, option, config.getint(section, option))
                else:
                    # string options (including "None")
                    _value = config.get(section, option)
                    if _value == 'None':
                        setattr(self, option, None)
                    elif _value == 'True':
                        setattr(self, option, True)
                    elif _value == 'False':
                        setattr(self, option, False)
                    else:
                        setattr(self, option, _value)


    def flux_to_mdot(self, X, dist, xi_p, mass, radius, flux=None):
        """
        Function to convert fluxes to accretion rate, in units of the
        Eddington rate, calculated using the mdot_Edd function

        This routine uses the precise calculation of Q_grav, i.e.  c^2z/(1+z)

        :param X: accreted H-fraction
        :param dist: source distance (kpc)
        :param xi_p: anisotropy of persistent emission
        :param mass: NS mass (M_sun)
        :param radius: NS radius (km)
        :param flux: flux value or array to convert. If None, then we just
          return the observed persistent flux and error

        :return: mdot, mdot_err OR individual flux values
        """

        if flux is None:
            return self.flux_to_mdot(X, dist, xi_p, mass, radius, self.pflux), \
                self.flux_to_mdot(X, dist, xi_p, mass, radius, self.pfluxe)

        opz = 1./(np.sqrt(1.-self.gmrc2*mass/radius))

        return (self.r1*flux*self.bc*dist**2*xi_p*opz**2
            / (radius**2*(opz-1)) / self.mdot_Edd(X, radius) ).decompose().value


    def lnlike(self, theta_in, x, y, yerr, components=False):
        """
        Calculate the "model" likelihood for the current walker position
        Calls runmodel which actually runs the model, either generating a
        burst train, or a set of runs for "ensemble" mode. Then extracts the
        relevant model outputs and calculates the likelihood.

        :param theta_in: parameter vector, with *X*, *Z*, *Q_b*, *d*, *xi_b*,
          *xi_p*, *mass*, *radius*, and (optionally) *f_E* & *f_a*
        :param x: the "independent" variable, passed to lnlike
        :param y: the "dependent" variable (i.e. measurements), passed to lnlike
        :param yerr: erorr estimates on y

        :return: likelihood, model result array
        """

        # define theta_in = model parameters, which we define priors for

        X, Z, Q_b, dist, xi_b, xi_p, *extra = theta_in
        mass, radius, f_E, f_a = extra+[self.M_NS, self.R_NS, 1.0, 1.0][len(extra):]

        # call model (function runmodel, in run_model.py) to generate the burst
        # train, or the set of bursts (for "ensemble" mode. In earlier versions
        # the corresponding IDL function was defined as
        # modeldata(base, z, x, r1, r2 ,r3)

        assert np.allclose(y, self.y)
        model, valid, model2 = runmodel( theta_in, self)
        if not valid:
            return -np.inf, model

        # To simplify final likelihood expression we define inv_sigma2 for each
        # data parameter that describe the error.  The variance (eg sEb0) is
        # underestimated by some fractional amount, f, for each set of
        # parameters.

        ato = int(self.train) # array "train" offset
        err_fac = np.concatenate(( np.full(self.numburstsobs-ato,1.),
            np.full(self.numburstsobs,f_E), np.full(self.numburstsobs-ato,f_a)))
        inv_sigma2 = 1./(yerr[:self.ly]*err_fac[:self.ly])**2

        # Final likelihood expression
        # Because the y (observed value) vector may or may not include the
        # alpha values, we need to truncate the other vectors here

        # cpts = (self.y - (model)) ** 2 * inv_sigma2 - (np.log(inv_sigma2))
        cpts = (self.y - model[:self.ly]) ** 2 * inv_sigma2 - (np.log(inv_sigma2))

        # if the components flag is set, also add those to the model dict

        if components:
            model2['cpts'] = cpts

        # Test if the result string is defined here. It is, so we return the selected elements of result
        # instead of the downselection in model

        # Now also return the model
        return -0.5 * np.sum(cpts), model2


    # -------------------------------------------------------------------------#
    # Finally we combine the likelihood and prior into the overall lnprob function, called by emcee

    # define lnprob, which is the full log-probability function
[docs]    def lnprob(self, theta_in, x, y, yerr):
        """
        The full log-probability function incorporating the priors (via
        the ``Beans.lnprior`` attribute), and model likelihood (via
        :meth:`Beans.lnlike`), that is passed to ``runemcee`` when creating
        the sampler (in the :meth:`Beans.do_run` method).

        :param theta_in: parameter vector, with *X*, *Z*, *Q_b*, *d*, *xi_b*,
          *xi_p*, *mass*, *radius*, and (optionally) *f_E* & *f_a*
        :param x: the "independent" variable, passed to :meth:`Beans.lnlike`
        :param y: the "dependent" variable (i.e. measurements), passed to
          :meth:`Beans.lnlike`
        :param yerr: erorr estimates on y
        :return: total (prior+model) likelihood, prior likelihood, model array
          (from :meth:`Beans.lnlike`)
        """

        lp = self.lnprior(theta_in)
        # Check if the parameters are consistent with the prior, and skip
        # the model run it if not
        if (not np.isfinite(lp)):
            return -np.inf, -np.inf, None

        # Now also returns the model, to accumulate along with the likelihoods

        like, model = self.lnlike(theta_in, x, y, yerr)

        if (not np.isfinite(like)):
            return -np.inf, -np.inf, model

        # encoding below is so we have a suitable object for including in
        # the blobs (see the dtype specification in runemcee)

        return lp + like, lp, model_str(model).encode('ASCII')


[docs]    def plot(self, show_model=True, model=None, mdot=True, title=None, 
        savefig=False):
        """
	Display a plot of the data and model results, for a burst train
        calculated with generate_burst_train Adapted from the example at
        https://matplotlib.org/gallery/api/two_scales.html

        :param show_model: set to False to skip the model generation step, in which case only the observed data will be plotted
        :param model: array of packed model prediction, OR dict giving full model results
        :param mdot: flag to show mdot rather than flux (only possible if you're passing the full model)
        :param title: add a title, if required
        :param savefig: set to True to save the figure to PDF
        """

        flux_colour = 'tab:red'
        bursts_colour = 'tab:blue'
        obs_colour = 'tab:grey'

        # for the default linear interpolation connect the flux
        # measurements by lines

        ls = '-'
        if self.interp == 'spline':
            ls = ''

        X, Z, Q_b, dist, xi_b, xi_p, *extra = self.theta
        mass, radius, f_E, f_a = extra+[self.M_NS, self.R_NS, 1.0, 1.0][len(extra):]

        imatch = None
        if (model is None) & show_model:
            # no need to do the matching here
            test, valid, model = runmodel(self.theta, self, match=False,
                debug=False)

            # ... but it's useful to know if it's possible

            imatch = burst_time_match(self.ref_ind, self.bstart,
                model['iref'], np.array(model['time']))

            if imatch is None:
                print ("\n** WARNING ** can't match predicted bursts to observations")

        full_model = False  # Flag to remember whether we're plotting the
                            # full model output of generate burst train or
                            # the packed output array
        if type(model) == dict:
            full_model = True
            timepred = model["time"]
            if (len(timepred) == 0): # | (not valid):
                print ('** ERROR ** no predicted times to show')
                show_model = False
            else:
                ebpred = np.array(model["fluen"])
        elif type(model) == list:
            breakpoint()
	    # The other way to return the model is as an array with the
	    # burst times, fluences and alphas all together. So unpack
	    # those here
            timepred = model[:self.numburstssim+1]
            ebpred = np.array(model[self.numburstssim+int(self.train):self.numburstssim*2+int(self.train)]) * self.fluen_fac/xi_b/dist**2

        # Now set up the figure

        if show_model & (imatch is not None):
            fig, axs = plt.subplot_mosaic([['main'],['main'],['resid']])
            ax1 = axs['main']
        else:
            fig, ax1 = plt.subplots()
        # fig.figure(figsize=(10,7))

        ax2 = ax1.twinx()  # instantiate a second axes that shares the same x-axis
        if self.gti_checking:
            #plot satellite gtis
            for i in range(1,len(self.st)):
                ax1.axvspan(self.st[i],self.et[i],facecolor='0.5', alpha=0.2)
            ax1.axvspan(self.st[0],self.et[0], facecolor='0.5',alpha=0.2,label='Satellite GTIs')

        # first show the flux/mdot
        if mdot and full_model:
            # this is the usual (only?) plot style, showing mdot vs. time,
            # along with the burst model and observation comparison
            _mdot, _mdot_err = self.flux_to_mdot(X, dist, xi_p, mass, radius)
            ax1.set_ylabel('Accretion rate (fraction of Eddington)', color=flux_colour)
            if self.train:
                # show the burst train
                ax1.errorbar(self.tobs, _mdot, _mdot_err,
                    marker='.', ls=ls, color=flux_colour, label='mdot')
                if self.interp == 'spline':
                    t = np.arange(min(self.tobs), max(self.tobs), 0.1)
                    ax1.plot(t, self.flux_to_mdot(X, dist, xi_p, mass, radius,
                        BSpline(*self.tck_s)(t)), color=flux_colour)
                # show the time of the "reference" burst
                # ax2.axvline(timepred[self.iref], c='k')
                ax2.axvline(self.bstart[self.ref_ind], c='k', ls='--')
            else:
                # show the ensemble comparison, which is much simpler
                ax1.errorbar(self.bstart, _mdot, _mdot_err, fmt='.',
                         color=flux_colour, label='mdot')
        else:
            ax1.set_ylabel('Persistent flux ($10^{-9}\\,{\\rm erg\\,cm^{-2}\\,s^{-1}}$)', color=flux_colour)
            if self.train:
                ax1.errorbar(self.tobs, self.pflux, self.pfluxe,
                    marker = '.', ls=ls, color=flux_colour, label = 'persistent flux')
                if self.interp == 'spline':
                    t = np.arange(min(self.tobs), max(self.tobs), 0.1)
                    ax1.plot(t, BSpline(*self.tck_s)(t), color=flux_colour)
                if show_model:
                    ax2.scatter(timepred[0], ebpred[0], marker = '*',color=bursts_colour,s = 100)
                ax1.set_xlabel("Time (days after MJD {})".format(self.tref))
            else:
                # "ensemble" mode plot vs. epoch, rather than observation time
                ax1.errorbar(self.bstart, self.pflux, self.pfluxe, fmt='.', color=flux_colour,
                         label='persistent flux')
                ax1.set_xlabel("Epoch (MJD)")

        ax1.tick_params(axis='y', labelcolor=flux_colour)

        # Plot the bursts here
        ax2.set_ylabel("Fluence ($10^{-6}\\,{\\rm erg\\,cm^{-2}}$)", color=obs_colour)
        if self.train:
            if self.bstart is not None:
                # Plot the observed bursts, if available
                # ax2.scatter(tobs,ebobs, color = 'darkgrey', marker = '.', label='observed', s =200)
                ax2.errorbar(self.bstart[self.ifluen], self.fluen[self.ifluen],
                    yerr=self.fluene[self.ifluen],
                    color=obs_colour, linestyle='', marker='.', ms=13,
                    label='observed bursts')
                for i in range(self.numburstsobs):
                    if (i not in self.ifluen) & (i != self.ref_ind):
                        ax2.axvline(self.bstart[i], color=obs_colour, ls='--')

            if show_model:
                ax2.scatter(timepred[1:], ebpred, marker = '*',color=bursts_colour,s = 100, label = 'predicted bursts')
            # we have time but not fluence for the first burst
                ax2.axvline(timepred[0], color=bursts_colour, ls='--')
                # and the averaged mdot over the burst interval (predicted)
                av_mdot = []
                for i in range(len(timepred)-1):
                    av_mdot.append(self.flux_to_mdot(X, dist, xi_p, mass, radius,
                        self.mean_flux(timepred[i], timepred[i+1], self)))
                av_mdot.insert(0, av_mdot[0])
                ax1.step(timepred, av_mdot, where='pre', color=flux_colour)

                if imatch is not None:
                    # show the burst time comparison
                    resid = -(self.bstart-np.array(timepred)[imatch])*24.
                    axs['resid'].plot(imatch, resid,
                        linestyle='', marker='.', ms=13, color=obs_colour)
                    for i in range(self.numburstsobs):
                        axs['resid'].annotate(' {}'.format(i+1), 
                            (imatch[i], resid[i]) )
                    axs['resid'].axhline(0.0, color=obs_colour, ls='--')
                    axs['resid'].set_xlabel('Burst number (predicted)')
                    axs['resid'].set_ylabel('Time offset (hr)')
                    print ('RMS obs-model offset = {:.4f} hr'.format(
                        np.sqrt(np.mean(resid**2))))

        else:
            ax2.scatter(self.bstart,ebobs, color = 'darkgrey', marker = '.', label='observed', s =200)
            if show_model:
                ax2.scatter(self.bstart, ebpred, marker = '*',color=bursts_colour,s = 100, label = 'predicted')

        ax2.tick_params(axis='y', labelcolor=obs_colour)

        ax1.set_xlabel("Time (days after MJD {})".format(self.tref))
        if title is not None:
            plt.title(title)

        fig.tight_layout()  # otherwise the right y-label is slightly clipped

        fig.legend(loc=1)

        if savefig:
            file = f'{self.run_id}_plot.pdf'
            print ('Saving figure plot to {}'.format(file))
            fig.savefig(file)

        fig.show()

[docs]    def sim_data(self, file=None):
        """
        This method generates a table of simulated data based on the
        current theta vector, that can be used for tests of the MCMC
        method

        Errors are taken as the mean of the observational errors; bursts
        matching observed bursts (according to the matching algorithm)
        are flagged as ``True`` in the 6th column

        In lieu of an output file, you can just paste the results into a
        text file and use as the input (specify as ``burstname``)

        :param file: file to save the results to (not yet implemented)

        :return:
        """

        print ("Generating simulated data based on parameter vector\n  theta={}:".format(self.theta))

        X, Z, Q_b, dist, xi_b, xi_p, *extra = self.theta
        mass, radius, f_E, f_a = extra+[self.M_NS, self.R_NS, 1.0, 1.0][len(extra):]

        opz = 1./(np.sqrt(1.-self.gmrc2*mass/radius))
        print ('  i.e. source at d={:.2f} kpc, xi_b={:.4f}, xi_p={:.4f}, X={:.2f}, Z={:.3f}, M_NS={:.2f}, R_NS={:.2f}, 1+z={:.3f}, Q_b={:.2f}'.format(
            dist,  xi_b, xi_p, X, Z, mass, radius, opz, Q_b))
        if self.obsname is not None:
            print ('  persistent fluxes from {}, interp={}, bc={}\n'.format(
                self.obsname, self.interp, self.bc))

        test, valid, full_model = runmodel(self.theta, self)

        if self.train:
            for i in range(len(full_model['time'])):
                if i == 0:
                    print('{:.5f}	{:.4f}	{:.4f}	{:.1f}	{:.1f}	{}'.format(full_model['time'][0]+self.tref, full_model['fluen'][0],np.mean(self.fluene),0.,0.,str(i in full_model['imatch'])))
                else:
                    print('{:.5f}	{:.4f}	{:.4f}	{:.1f}	{:.1f}	{}'.format(full_model['time'][i]+self.tref, full_model['fluen'][i-1],np.mean(self.fluene),full_model['alpha'][i-1],np.mean(self.alphae[1:]),str(i in full_model['imatch'])))

        else:
            for i in range(len(self.bstart)):
                print('{:.5f}       {:.3f}      {:.3f}  {:.1f}  {:.1f}  {:.3f}  {:.3f}  {:.3f}  {:.3f}'.format(
                    self.bstart[i], self.fluen[i], self.fluene[i],
                    self.alpha[i],self.alphae[i],self.pflux[i],
                    self.pfluxe[i],self.tdel[i],self.tdele[i]))

    # -------------------------------------------------------------- #

    def distance_limit(self, distrange=[1,10], Xmin= 0.01, gridsize=10, numtrains=100, skiplo=True):
        """
        Generate burst trains and test how many of them are consistent with the GTIs
        """

        assert len(distrange) == 2

        X_0, Z, Q_b, dist, xi_b, xi_p, *extra = self.theta
        mass, radius, f_E, f_a = extra+[self.M_NS, self.R_NS, 1.0, 1.0][len(extra):]

        # Loop over the distance values

        distance = np.linspace(distrange[0], distrange[1], gridsize)
        X = np.linspace(Xmin, 0.7, gridsize)
        idist = cd.iso_dist(nsamp=gridsize)
        xi_b, xi_p = cd.anisotropy(idist)

        # initialise the array to keep to grid results

        result = np.zeros((gridsize, gridsize))

        for i, _distance in enumerate(distance):

            # For each distance, loop over the h-fraction range
            for j, _X in enumerate(X):

                # initialise result array
                valid_array = []

                print('Drawing one of {} values for xi_p:'.format(len(xi_p.distribution)))
                # For each distance and h-fraction, draw a bunch of inclination values and xi_p's:
                for _xi_p in xi_p.distribution:

                    r1 = _xi_p.value*(_distance/10)**2
                    theta_1 = (_X, Z, Q_b, f_a, f_E, r1, r2, r3, mass, radius)

                    # Run for just one burst to get the initial interval
                    # Set ref_ind to be zero, will subsequently distribute the start burst times
                    # between up to the simulated interval
                    test, valid, result = runmodel(theta_1, self.y, 0.0, self.bstart,
                                           self.pflux, self.pfluxe, self.tobs, 1,1, 0.0,
                                           0, self.train, debug=False)
                    print("result: ", test, valid)
                    # self.plot_model(test)

                    # find the initial range of start times to distribute the bursts over

                    if (test is not None) & (len(test['time']) > 1):
                        # iref = np.argmin(abs(np.array(test['time'])-self.tref))
                        iref = np.argmin(abs(np.array(test['time'])))
                        intvl = test['time'][iref+1]
                    else:
                        # If we can't get an initial burst train, distribute the start times
                        # over the entire outburst
                        intvl = max(self.tobs)
                    # This piece of code is probably redundant now that next_burst checks for
                    # predicted burst times beyond tobs
                    if (intvl > 2.*max(self.tobs)) and skiplo:
                        print ('Skipping trials with d={:.4f} and X={:.4f} due to excessive tdel {} >> {}'.format(
                            _distance, _X, intvl, max(self.tobs) ))
                        valid_array.append(True)
                    else:
                        # intvl = min([test['time'][iref+1], max(self.tobs)])

                        trials = np.linspace(0., intvl, numtrains)
                        print ('Simulating {} trains with reference burst distributed within (0, {:.3f})'.format(numtrains, intvl))

                        for trial in trials:

                            print ('trial {:.4f}:'.format(trial))
                            # Set nburstssim to 100 below, just need to make sure it's sufficient to cover
                            # the whole outburst. Replace ref_ind with trial, as the starting burst time
                            # (ref_ind is meaningless if there's no bursts)
                            test, valid, result = runmodel(theta_1, self.y, 0.0, self.bstart,
                                                   self.pflux, self.pfluxe, self.tobs, 100,100, trial,
                                                   1,self.train, gti_start=self.st, gti_end=self.et, debug=False)

                            # for debugging
                            # self.plot_model(test)
                            # breakpoint()

                            valid_array.append(valid)
                            print ('  valid={}'.format(valid))


                result[i,j] = len(np.where(valid_array)[0])/len(valid_array)
                print ('End of loop for d={}, X={}, % valid is {}'.format(
                    _distance, _X, 100*result[i,j] ))

        breakpoint()

    # -------------------------------------------------------------- #

[docs]    def do_run(self, plot=False, analyse=True, burnin=2000, **kwargs):
        """
        This routine runs the chain for as many steps as is specified in
        the init call.  Emcee parameters are defined in runemcee module.
        Have previously used multiprocessing to speed things up, but that's
        not currently active

        :param plot: set to True to do the plot of the initial guess. This
          seems redundant since it's also plotted at the __init__ stage
        :param analyse: set to True to call do_analysis automatically once the
          chains finish
        :param burnin: number of steps to ignore at the start of the run,
          passed to do_analysis

        :return:
        """

        # Check here if we've already run the analysis

        if hasattr(self, 'reader'):
            print ('''
** WARNING ** re-running the sampler after calling do_analysis can lead to
                memory issues; proceed with caution!''')
            value = input('              Press [RETURN] to continue: ')

        # Check the number of threads here

        ncpu = cpu_count()
        if self.threads > ncpu:
            print ('** ERROR ** number of threads is greater than number of CPUs ({} > {}); this seems ill-advised'.format(self.threads, ncpu))
            return

        # Want to avoid overwriting existing log & config files

        if (self.restart is False) and (os.path.exists(self.run_id+'.h5')):
            print ('\n** ERROR ** run will overwrite existing log file {}, set restart=True to extend'.format(self.run_id+'.h5'))
            return

        if (os.path.exists(self.run_id+'.ini')):
            print ('\n** WARNING ** run will overwrite existing config file {}'.format(self.run_id+'.ini'))
            value = input('              enter Y[RETURN] to continue: ')
            if (value != 'y') and (value != 'Y'):
                print ('do_run terminated')
                return
        self.save_config(clobber=True)

        print("# ---------------------------------------------------------------------------#")
        print (self)
        print("# ---------------------------------------------------------------------------#")
        # Testing the various functions. Each of these will display the likelihood value, followed by the model-results "blob"
        print("Testing the prior and likelihood functions..")
        print("lnprior:", self.lnprior(self.theta))
        print("lnlike:", self.lnlike(self.theta, None, self.y, self.yerr))
        print("lnprob:", self.lnprob(self.theta, None, self.y, self.yerr))
        print("# ---------------------------------------------------------------------------#")

        # for supplied positions, you want to check that they are all
        # valid

        if 'pos' in kwargs:

            # now also has the option to read in the positions from a
            # pickle file

            if type(kwargs['pos']) == str:
                print ('\nReading in positions from file {}...'.format(kwargs['pos']))
                new_pos = pickle.load(open(kwargs['pos'],'rb'))
                print ('... done')
            else:
                new_pos = kwargs['pos'].copy()

            if np.shape(new_pos) != (self.nwalkers, self.ndim):
                print ('** ERROR ** supplied positions has wrong dimensions; {} != {}'.format(np.shape(new_pos), (self.nwalkers, self.ndim)))
                return None

            print ('\n** WARNING ** walkers will start at provided position vector.\n              Checking supplied positions...')
            # assert len(kwargs['pos']) == self.nwalkers
            bad = np.full(len(new_pos), False)
            for i, pos in enumerate(new_pos):
                _test, _valid, _model = runmodel(pos, self)
                bad[i] = _test is None
            nbad = len(np.where(bad)[0])

            if nbad == 0:
                print ('... done. all OK, continuing')
            else:
                print ('... done. {}/{} positions invalid; redistributing...'.format(nbad, self.nwalkers))
                # if you have too many bad positions, you'll get an error
                # running with too many duplicates; need to possibly trap that
                # here
                for i in (np.where(bad)[0]):
                    new_pos[i] = kwargs['pos'][np.random.choice(np.where(~bad)[0])] #+ scale*np.random.randn(ndim)
                print ('... done')

            kwargs['pos'] = new_pos

        if plot:
            print("plotting the initial guess.. (you want the predicted bursts to match approximately the observed bursts here)")
            # make plot of observed burst comparison with predicted bursts:
            self.plot(title='Initial guess of parameters')
            value = input('Press [RETURN] to continue: ')

        _start = time.time()

        # run the chains and save the output as a h5 file
        # TODO to simplify the subsequent analysis I think this object
        # should be added to the Beans object
        sampler = runemcee(self.nwalkers, self.nsteps,
            self.theta, self.lnprob, self.lnprior, None, self.y, self.yerr,
            self.run_id, self.restart, self.threads, self.stretch_a, **kwargs)

        _end = time.time()
        print ("  run_id {} took {:.1f} seconds for {} steps".format(
            self.run_id, _end-_start, self.nsteps))

        if analyse:
            print ("\nRunning analses with do_analysis...")
            self.do_analysis(burnin=burnin)
        #if self.restart == False:
            #sampler.reset()

# -------------------------------------------------------------------------#

    def plot_autocorr(self, samples=None, reader=None, savefile=None, figsize=(8,5) ):
        """
        This method shows the estimated autocorrelation time for the run
        Extracted from do_analysis, and originally based on the analysis
        described in the example for emcee:
        https://emcee.readthedocs.io/en/stable/tutorials/autocorr

        :param samples: numpy array with samples, to calculate the
          autocorrelation from
        :param reader: object to get the chains from (if not supplied via
	  the samples parameter), via the get_chain method. TODO just pass
          the samples to make this more general
        :param savefile: name of file to save as (skip if None)
        :param figsize: size for the figure, (tuple, in inches)

        :return:
        """

        def next_pow_two(n):
            i = 1
            while i < n:
                i = i << 1
            return i

        def autocorr_func_1d(x, norm=True):
            x = np.atleast_1d(x)
            if len(x.shape) != 1:
                raise ValueError("invalid dimensions for 1D autocorrelation function")
            n = next_pow_two(len(x))

            # Compute the FFT and then (from that) the auto-correlation function
            f = np.fft.fft(x - np.mean(x), n=2*n)
            acf = np.fft.ifft(f * np.conjugate(f))[:len(x)].real
            acf /= 4*n

            # Optionally normalize
            if norm:
                acf /= acf[0]

            return acf


        def auto_window(taus, c):
            """
            Automated windowing procedure following Sokal (1989)
            """

            m = np.arange(len(taus)) < c * taus
            if np.any(m):
                return np.argmin(m)
            return len(taus) - 1


        def autocorr_gw2010(y, c=5.0):
            """
            Following the suggestion from Goodman & Weare (2010)
            """

            f = autocorr_func_1d(np.mean(y, axis=0))
            taus = 2.0*np.cumsum(f)-1.0
            window = auto_window(taus, c)
            return taus[window]


        def autocorr_new(y, c=5.0):
            f = np.zeros(y.shape[1])
            for yy in y:
                f += autocorr_func_1d(yy)
            f /= len(y)
            taus = 2.0*np.cumsum(f)-1.0
            window = auto_window(taus, c)
            return taus[window]


        if (samples is None) and (reader is None):
            # load in sampler:
            print ('Loading reader from {}.h5...'.format(self.run_id))
            reader = emcee.backends.HDFBackend(filename=self.run_id+".h5")

        if reader is not None:
            samples = reader.get_chain(flat=False)
            #tau = 20
            tau = reader.get_autocorr_time(tol=0) #using tol=0 means we'll always get an estimate even if it isn't trustworthy.
            thin = int(0.5 * np.min(tau)) # seems to be ignored - dkg
            print(f"The autocorrelation time for each parameter as calculated by emcee is: {tau}")
            print ("  mean {:.1f}, min {:.1f}, max {:.1f}".format(np.mean(tau),
                min(tau), max(tau)))

        # alternate method of checking if the chains are converged:
        # This code is from https://dfm.io/posts/autocorr/

        # get autocorrelation time:

        # loop through 10 parameters and plot the evolution of the
        # autocorrelation time estimate for each

        f = plt.figure(figsize=figsize)

        param = ["$X$", "$Z$", "$Q_{\mathrm{b}}$", "$d$", "$\\xi_b$",
            "$\\xi_p$", "$M$", "$R$", "$f_{\mathrm{E}}$", "$f_{\mathrm{a}}$"]

        for j in range(self.ndim):
            chain = samples[:, :, j].T
            # print(np.shape(sampler))

            N = np.exp(np.linspace(np.log(100), np.log(chain.shape[1]), self.ndim)).astype(int)
            # print(N)
            gw2010 = np.empty(len(N))
            new = np.empty(len(N))
            for i, n in enumerate(N):
                gw2010[i] = autocorr_gw2010(chain[:, :n])
                new[i] = autocorr_new(chain[:, :n])

            # Plot the comparisons
            #plt.loglog(N, gw2010, "o-", label="G\&W 2010")
            plt.loglog(N, new, "o-", label=f"{param[j]}")
            plt.loglog(N, gw2010, "o-", label=None, color='grey')
            ylim = plt.gca().get_ylim()

            #plt.ylim(ylim)
        plt.xlabel("Number of samples, $N$", fontsize='xx-large')
        plt.ylabel(r"$\tau$ estimates",fontsize='xx-large')



        plt.plot(N, np.array(N)/50.0, "--k")# label=r"$\tau = N/50$")
        plt.legend(fontsize='large',loc='best',ncol=2) #bbox_to_anchor=(0.99, 1.02)
        plt.xticks(fontsize=14)
        plt.yticks(fontsize=14)
        if savefile is not None:
            print ('plot_autocorr: saving figure as {}'.format(savefile))
            plt.savefig(savefile)
        plt.show()


[docs]    def burst_table(self, show=True, predicted=False, key=None):
        """
	This method creates and, optionally, displays a table from the
        model and observed bursts.

        The table is returned as an astropy Table object that can be saved
        as an MRT file, like so: ``tab.write('test.dat',format='mrt')``
	although you will have to then edit the file afterwards to
        complete the metadata

        :param show: set to True to display each row (in LaTeX format)
        :param predicted: set to True to show predicted bursts also (not yet implemented)
        :param key: for the case where we have more than one set of predictions (e.g. for different numbers of predicted bursts), the key will identify which to return

        :return: astropy table of burst properties
        """

        def strmeas(val, err, err_hi=None):
            '''
            Function to return nicely (TeX) formatted measurements, with errors
            Adapted (and simplified) from strmeas.pro

            For simplicity we consider only the case where the error is smaller 
            than the value. Since the error and the value need to be
            plotted to the same digit, we have essentially just two cases: 
            integer and integer, or float and float
            
            :param val: central value (50th percentile or whatever)
            :param err: if err_hi is not supplied, this is the symmetric error; otherwise, the lower error
            :param err_hi: upper uncertainty
            
            :returns: formatted string
            '''
            
            eta=1e-20     # Threshold for non-zero measurements
            sym_templ = '${{{}}}\pm{{{}}}$'
            asym_templ = '${{{}}}_{{{{{{{}}}}}}}^{{{{{{{}}}}}}}$'
            
            # get the number of significant figures of each of the errors
            fudge=0.0222764
            n_lo, n_hi = -1, -1
            if abs(err) > eta:
                n_lo=np.floor(np.log10(abs(err))+fudge)
                
            if err_hi is None:
                err_hi = err

            if abs(err_hi) > eta:
                n_hi=np.floor(np.log10(abs(err_hi))+fudge)

            lmin = int(min([n_lo, n_hi]))
            if (err < 2.*10.**n_lo) | (err_hi < 2.*10.**n_hi):
                # need an extra significant figure if the leading digit is 1
                lmin -= 1

            if (lmin < 0):

                # Floating point value

                rtnfmt = ':.{}f'.format(-lmin)
                if np.allclose(round(err, -lmin), round(err_hi, -lmin)):
                    # symmetric errors
                    res = sym_templ.format(rtnfmt, rtnfmt).format(val, err)
                else: 
                    # asymmetric errors
                    errfmt = ':+.{}f'.format(-lmin)
                    res = asym_templ.format(rtnfmt, errfmt, errfmt).format(val, -err, err_hi)
            else:

                # Integer value

                rtnfmt=':d'
                # round the quantities and convert to integers
                ival = int(np.floor(val/10.**lmin+0.5)*10.**lmin)
                ierr_lo = int(np.floor(err/10.**lmin+0.5)*10**lmin)
                ierr_hi = int(np.floor(err_hi/10.**lmin+0.5)*10**lmin)
                if np.allclose(ierr_lo, ierr_hi):
                    # symmetric errors
                    res = sym_templ.format(rtnfmt, rtnfmt).format(ival, ierr_lo)
                else:
                    # asymmetric errors
                    errfmt = ':+d'
                    res = asym_templ.format(rtnfmt, errfmt, errfmt).format(ival, -ierr_lo, ierr_hi)


            return res


        if not self.HAS_CONCORD:
            print ('** ERROR ** alpha calculation requires concord')
            return None

        if not hasattr(self, 'model_pred'):
            print ('** ERROR ** no model predictions available, run the comparison first')
            return None

        if (key is None) & (len(self.model_pred['time_stats'].keys()) > 1):
            print ('** ERROR ** multiple solutions are available, please specify one with the key keyword')
            print (self.model_pred['time_stats'].keys())
            return None

        elif key is None:
            key = list(self.model_pred['time_stats'].keys())[0]

        timepred = [x[0] for x in self.model_pred['time_stats'][key]]
        ref_tpred = np.argmin(np.abs(self.bstart[self.ref_ind]-timepred))
        imatch = burst_time_match(self.ref_ind, self.bstart, ref_tpred, np.array(timepred))

        bursts = Table()
        bursts['num'] = np.arange(self.numburstsobs)+1
        bursts['num'].info.description = 'Burst number'
        bursts['minbar_id'] = np.full(self.numburstsobs, 9999) # filler
        bursts['minbar_id'].info.description = 'MINBAR DR1 ID'
        bursts['time'] = Time(self.bstart+self.tref, format='mjd') 
        # we can set this, but it doesn't seem to be written when output
        # as MRT
        bursts['time'].info.description = 'Burst start time'
        bursts['bfluen'] = MaskedColumn(self.fluen, mask=self.fluen <= 0.,
            unit=FLUEN_U, description='Integrated burst fluence')
        bursts['e_bfluen'] = MaskedColumn(self.fluene, mask=self.fluen <= 0.,
            unit=FLUEN_U, description='Error on burst fluence')
        bursts['alpha_obs'] = MaskedColumn(self.alpha, mask=self.alpha <=0., 
            description='Burst alpha-value')
        bursts['e_alpha_obs'] = MaskedColumn(self.alphae, mask=self.alpha <=0., 
            description='Error on alpha-value')

        # Now loop over the bursts and calculate the derived quantities
        dt, e_dt, alpha, e_alpha, E_alpha = [], [], [], [], []
        for i in np.arange(self.numburstsobs):
            if imatch[i] > 0: 
                if imatch[i]-imatch[i-1] == 1:
                    # no missed bursts
                    _dt = (self.bstart[i]-self.bstart[i-1])*24.
                    perflx = self.mean_flux(self.bstart[i-1], self.bstart[i], self)
                else:
                    # one or more missed bursts, so use the model predictions for the previous time
                    _dt = (self.bstart[i] - np.array(self.model_pred['times'])[:,imatch[i]-1]) * 24.
                    perflx = [self.mean_flux(x, self.bstart[i], self) for x in np.array(self.model_pred['times'])[:,imatch[i]-1]]
                _alpha = self.cd.alpha(_dt,(self.fluen[i], self.fluene[i]), perflx).value
                if np.shape(_dt) == ():
                    # scalar _dt, exact recurrence time
                    dt.append(_dt)
                    e_dt.append(0.)
                    if show:
                        print ("{} & [minbar ID] & {} & {:.2f} & {} & {} & {} \\\\".format(
                            bursts['num'][i], bursts['time'][i], dt[-1],
                            strmeas(bursts['bfluen'][i], bursts['e_bfluen'][i]),
                            strmeas(bursts['alpha_obs'][i], bursts['e_alpha_obs'][i]),
                            strmeas(_alpha[0], _alpha[1], _alpha[2])))
                else:
                    dt_stats = np.percentile(np.array(_dt), [16,50,84])
                    dt.append(dt_stats[1])
                    e_dt.append((dt_stats[2]-dt_stats[0])*0.5)
                    if show:
                        print ("{} & [minbar ID] & {} & {} & {} & {} & {} \\\\".format(
                            bursts['num'][i], bursts['time'][i], 
                            strmeas(dt[-1], e_dt[-1]), 
                            strmeas(bursts['bfluen'][i], bursts['e_bfluen'][i]),
                            strmeas(bursts['alpha_obs'][i], bursts['e_alpha_obs'][i]),
                            strmeas(_alpha[0], _alpha[1], _alpha[2])))
                alpha.append(_alpha[0])
                e_alpha.append(_alpha[1])
                E_alpha.append(_alpha[2])
            else:
                # not sure what this case is for (excluded bursts?)
                dt.append(0.)
                e_dt.append(0.)
                alpha.append(0.)
                e_alpha.append(0.)
                E_alpha.append(0.)
                if show:
                    print ("{} & & {} & \\nodata & {} & \\nodata & \\nodata \\\\".format(
                        bursts['num'][i], bursts['time'][i],
                        strmeas(bursts['bfluen'][i], bursts['e_bfluen'][i])))

        bursts['trec'] = MaskedColumn(dt, mask=np.array(dt) <=0., unit=u.hr, 
            description='Burst recurrence time')
        bursts['e_trec'] = MaskedColumn(e_dt, mask=np.array(dt) <=0., unit=u.hr,
            description='Error on recurrence time')
        bursts['alpha_mod'] = MaskedColumn(alpha, mask=np.array(alpha) <= 0.,
            description='Model-informed alpha value')
        bursts['e_alpha_mod'] = MaskedColumn(e_alpha, mask=np.array(alpha) <= 0.,
            description='Lower limit on model alpha')
        bursts['E_alpha_mod'] = MaskedColumn(E_alpha, mask=np.array(alpha) <= 0.,
            description='Upper limit on model alpha')

        # set the formats here. These should be OK for most cases!
        bursts['trec'].info.format='5.2f'
        bursts['e_trec'].info.format='5.2f'
        bursts['alpha_mod'].info.format='6.2f'
        bursts['e_alpha_mod'].info.format='4.2f'
        bursts['E_alpha_mod'].info.format='4.2f'

        return bursts


[docs]    def do_analysis(self, options=['autocor','posteriors'],
                          part=None, truths=None, burnin=2000,
                          savefig=False):
        """
        This method is for running standard analysis and displaying the
        results.
        Nothing is returned, but various options for analysis are
        available, which will (optionally) populate some of the
        :class:`beansp.Beans` attributes, including

        | reader - sampler object read in from HDF file
        | sampler - chain data
        | nsteps_completed - number of steps completed
        | samples - flattened samples, omitting first samples_burnin
        | last - last walker positions
        | probs - likelihoods (total, prior, and contributions from each parameter) for the last walker positions
        | cc - ChainConsumer object with samples and derived cosi, gravity, redshift
        | cc_parameters - plot labels for cc object
        | model_pred - dictionary with model realisations read in from the "blobs"

	By default the method will also create several files, labeled by
        the run_id; drawn from

        | {}_autocorrelationtimes.pdf (via plot_autocorr)
        | {}_posteriors.pdf
        | {}_parameterconstraints_pred.txt

        TODO: need to reorganise a bit, and add more options

        :param options: array of strings corresponding to various analysis
          options, listed in the analyses dict below
	:param part: string or array "partition" dividing the set of
          samples into two or more separate groups for analysis
        :param truths: parameter vector to overplot on (one of the) corner
          plots (TODO: need to check if >1 corner plot are selected
          +truths, which will likely result in an error due to
          incompatible number of parameters)
        :param burnin: number of steps to discard when plotting the posteriors
        :param savefig: set to True to save figures to .pdf files, False to skip

        :return: none
        """

        # constants:
        c = const.c.to('cm s-1')
        G = const.G.to('cm3 g-1 s-2')

        # list of available analyses

        analyses = {'autocor': 'autocorrelation times as a function of timestep',
                    'chain': 'first 300 iterations of the chains',
                    'posteriors': 'raw posteriors and the input values',
                    'mrcorner': 'corner plot with M, R, g and 1+z',
                    'fig6': 'corner plot with xi_b, xi_p, d, Q_b, Z',
                    'fig8': 'xi_b vs. xi_p and models for comparison',
                    'converge': 'check the convergence via posterior evolution',
                    'comparison': 'observed and predicted burst times, fluences',
                    'last': 'analyse last walker positions' }

        if options == 'all':
            options = analyses.keys()

        # check the chosen option is one of those implemented

        for option in options:
            if option not in analyses.keys():
                print ('** ERROR ** {} is not an available analysis option; choose from'.format(option))
                for key in analyses.keys():
                    print ('  {}: {}'.format(key, analyses[key]))
                return

        if not hasattr(self, 'reader'):

            print ("Reading in samples...")# to calculate autocorrelation time...")

            # load in sampler:
            self.reader = emcee.backends.HDFBackend(filename=self.run_id+".h5")

            # Read in the full chain to get the number of steps completed
            self.sampler = self.reader.get_chain(flat=False)
            self.nsteps_completed = np.shape(self.sampler)[0]

            print ("... done. Got {} steps completed".format(self.nsteps_completed))
            self.samples_burnin = None
            self.models_burnin = None

        if (burnin != self.samples_burnin) | \
            (burnin != self.models_burnin):

            # moved burnin to be a parameter, so we can pass that from do_run
            # want to make sure we're using at least about 1000 samples for
            # our statistics

            # if burnin >= self.nsteps_completed*0.9:
            if (self.nsteps_completed*self.nwalkers-burnin < 1000) | \
                (self.nsteps_completed < burnin):
                print ('\n** WARNING ** discarding burnin {} will leave too few steps ({} total), ignoring'.format(burnin, self.nsteps_completed))
                burnin = 0

            # print ("Reading in flattened samples to show posteriors...")
            # samples = self.reader.get_chain(flat=True, discard=burnin)
            samples = self.sampler[burnin:,:,:]
            self.last = samples[-1,:,:]
            self.samples = samples.reshape((-1,self.ndim))
            self.samples_burnin = burnin

            cosi_2 = 1/(2*self.samples[:,5])
            cosi = 0.5/(2*(self.samples[:,5]/self.samples[:,4])-1)

            # here now create the overall chainconsumer object that will
            # enable the various posterior plots below

            labels = {"X": "$X$", "Z": "$Z$", "Qb": "$Q_b$ (MeV)",
                "d": "$d$ (kpc)", "xi_b": "$\\xi_b$", "xi_p": "$\\xi_p$"}

            if self.ndim >= 7:
                labels["M"] = "$M$ ($M_\odot$)"
                mass = self.samples[:,6]
                masspred = get_param_uncert(mass)
            if self.ndim >= 8:
                labels["R"] = "$R$ (km)"
                radius = self.samples[:,7]
                radiuspred = get_param_uncert(radius)

                # calculate redshift and gravity from mass and radius:
                # keep the parameters that we're going to calculate limits on
                # below, dimensionless

                R = np.array(radius)*1e5*u.cm #cgs
                M = np.array(mass)*const.M_sun.to('g') #cgs

                # ChainConsumer's plot method can't handle Quantity objects,
                # so we need to convert gravity and redshift back to numpy
                # arrays here
                redshift = np.power((1 - (2*G*M/(R*c**2))), -0.5).value
                gravity = (M*redshift*G/R**2 / (u.cm/u.s**2)).value #cgs

                redshiftpred = get_param_uncert(redshift)
                gravitypred = get_param_uncert(gravity)

            if self.ndim >= 9:
                labels["fE"] = "$f_E$"
            if self.ndim == 10:
                labels["fa"] = "$f_a$"


            # now create the chainconsumer object

            _plot_labels = labels
            _plot_labels['cosi'] = '$\cos i$'
            if self.ndim >= 8:
                _plot_labels['g'] = '$g$ (cm s$^{-2}$)'
                _plot_labels['1+z'] = '$1+z$'
                _samples =np.column_stack((self.samples, cosi, gravity, redshift))
            else:
                _samples =np.column_stack((self.samples, cosi))

            self.cc = ChainConsumer()
            # self.cc.add_chain(_samples, parameters=_labels)
            self.cc.add_chain(_samples, parameters=list(_plot_labels.values()),
                name=self.run_id)
            # configure params below copied from Adelle's jupyter notebook
            # we apply them here for consistency across all the posterior
            # plots
	    # despite the original sigmas setting, only 2 contours are
	    # shown...? (the first two, 1 & 2 sigma)
            self.cc.configure(usetex=True, serif=True, 
                flip=False, summary=False,
                bins=0.7, # has the effect of light smoothing of the histograms
                diagonal_tick_labels=False, max_ticks=3, shade=True, \
                shade_alpha=1.0 ,bar_shade=True, tick_font_size='xx-large', \
                label_font_size='xx-large',smooth=True, \
                sigma2d=False, sigmas=[1,2]) #np.linspace(0, 3, 4))
            self.samples = _samples # keep the samples up to date
            self.cc_parameters = _plot_labels
            self.cc_nchain = 1 # initially

	    # Now get the remainder of the parameter uncertainties and
	    # save to the text file

            Xpred = get_param_uncert(self.samples[:,0])
            Zpred = get_param_uncert(self.samples[:,1])
            basepred = get_param_uncert(self.samples[:,2])
            dpred = get_param_uncert(self.samples[:,3])
            cosipred = get_param_uncert(cosi)
            xibpred = get_param_uncert(self.samples[:,4])
            xippred = get_param_uncert(self.samples[:,5])

	    # save to text file with columns: value, upper uncertainty,
	    # lower uncertainty
            # have to have a few options here depending on whether the
            # mass is included or not
            # TODO also include f_E, f_a if they're included

            header='''beansp v{} parameter file
run_id {}, nsteps_completed={}, skipping {} steps for burnin

Each row has the 50th percentile value, upper & lower 68% uncertainties

Rows are:
H mass fraction (X), metallicity (Z), base flux (Q_b), distance (d, kpc),
cos i, persistent anisotropy factor (xi_p), burst anisotropy factor (xi_b)'''

            if self.ndim == 6:
                np.savetxt(f'{self.run_id}_parameterconstraints_pred.txt',
                    (Xpred, Zpred, basepred, dpred, cosipred, xippred, xibpred),
                    fmt='%9.6f', header=header.format(__version__, self.run_id, self.nsteps_completed,self.samples_burnin))
            elif self.ndim == 7:
                header = header+',\nNS mass (M_sun)'
                np.savetxt(f'{self.run_id}_parameterconstraints_pred.txt',
                    (Xpred, Zpred, basepred, dpred, cosipred, xippred, xibpred,
                    masspred), fmt='%9.6f', header=header.format(__version__, self.run_id, self.nsteps_completed,self.samples_burnin,))
            else:
                header = header+', NS radius (km), gravity (g, 10^14 cm/s^2), redshift (1+z)'
                np.savetxt(f'{self.run_id}_parameterconstraints_pred.txt',
                    (Xpred, Zpred, basepred, dpred, cosipred, xippred, xibpred,
                    masspred, radiuspred, gravitypred/1e14, redshiftpred),
                    fmt='%9.6f', header=header.format(__version__, self.run_id, self.nsteps_completed,self.samples_burnin))

        # ---------------------------------------------------------------------#
        if 'last' in options:

            # show likelihood contributions for last step
	    # TODO could also use the reader.get_last_sample method, at
	    # least for p_tot, but this won't give you the likelihood
            # contributions. It does include as the 4th element the prior
            # and model realisations (blobs) though

            probs = pd.DataFrame(columns = ['p_tot','prior','p_time','p_fluen','p_alpha'],
                index = np.arange(self.nwalkers) )
            p_fluen, p_alpha = 0.0, 0.0
            for _i in np.arange(np.shape(self.last)[0]):
                ptot, model = self.lnlike(self.last[_i,:], None, self.y, self.yerr, components=True)
                ato = int(self.train)
                p_time = -0.5*np.sum(model['cpts'][:self.numburstsobs-ato])
                if self.cmpr_fluen:
                    p_fluen = -0.5*np.sum(model['cpts'][self.numburstsobs-ato:2*self.numburstsobs-ato])
                if self.cmpr_alpha:
                    p_alpha = -0.5*np.sum(model['cpts'][2*self.numburstsobs-ato:])
                pprior = self.lnprior(self.last[_i,:])
                probs.loc[_i] = [ptot, pprior, p_time, p_fluen, p_alpha]

            self.probs = probs

        # ---------------------------------------------------------------------#
        # PLOTS
        # ---------------------------------------------------------------------#

        if 'autocor' in options:

            # plot autocorrelation times

            if savefig:
                self.plot_autocorr(reader=self.reader, savefile='{}_autocorrelationtimes.pdf'.format(self.run_id))
            else:
                self.plot_autocorr(reader=self.reader, savefile=None)
                print ('Skipping autocorrelation plot save')
            print ("...done")

        #sampler = emcee.EnsembleSampler(self.nwalkers, self.ndim, self.lnprob, args=(self.x, self.y, self.yerr), backend=reader)

        # ---------------------------------------------------------------------#
        if 'chain' in options:

            # plot the chains:

            print ("Plotting the chains...")
            labels = ["$X$","$Z$","$Q_b$","$d$", "$\\xi_b$", "$\\xi_p$", "$M$", "$R$","$f_E$", "$f_a$"]
            # plt.clf()
            fig, axes = plt.subplots(self.ndim, 1, sharex=True, figsize=(8, 9))

            for i in range(self.ndim):
                # Previously the transposed sampler object below meant
                # that we were plotting with walker number on the x-axis,
                # instead of step. Now fixed
                axes[i].plot(self.sampler[:,:,i], color="k", alpha=0.4)
                axes[i].yaxis.set_major_locator(MaxNLocator(5))
                axes[i].set_ylabel(labels[i])

            axes[self.ndim-1].set_xlabel("step number")
            plt.tight_layout(h_pad=0.0)
            if savefig:
                print ('Saving chain plot to {}chain-plot.pdf'.format(self.run_id))
                plt.savefig(self.run_id+'chain-plot.pdf')
            else:
                print ('Skipping chain plot save')

            plt.show()
            print ("...done")

        # ---------------------------------------------------------------------#
        if 'posteriors' in options:

            # make plot of posterior distributions of your parameters:
            # (using the already-created ChainConsumer object)

            if truths is None:
                truths = list(self.theta)

            if savefig:
                self.cc.plotter.plot(parameters=list(self.cc_parameters.values())[:self.ndim],
                    filename=self.run_id+"_posteriors.pdf",
                    figsize="page", truth=truths)
            else:
                fig = self.cc.plotter.plot(parameters=list(self.cc_parameters.values())[:self.ndim],
                    figsize="page", truth=truths)
                fig.show()
            print ("...done")

        # ---------------------------------------------------------------------#
        if ('mrcorner' in options) & (self.ndim < 8):
            print ('** ERROR ** can''t show M-R posteriors as one or both of M & R are fixed')
        elif 'mrcorner' in options:

            # mrgr = np.column_stack((mass, radius, gravity, redshift))

            # plot with chainconsumer:
            # cc = ChainConsumer()
            # cc.add_chain(mrgr, parameters=["M", "R", "g", "1+z"])
            if savefig:
                self.cc.plotter.plot(parameters=[self.cc_parameters[x] for x in ["M", "R", "g", "1+z"]],
                    filename=self.run_id+"_massradius.pdf",
                    truth=truths, figsize="page")
            else:
                fig = self.cc.plotter.plot(parameters=[self.cc_parameters[x] for x in ["M", "R", "g", "1+z"]],
                    figsize="page", truth=truths)
                fig.show()

        # ---------------------------------------------------------------------#
        if 'fig6' in options:

            # fig6data = np.column_stack((xip, xib, distance, base, Z, X))
            # fig6data = np.column_stack((X, Z, base, distance, xib, xip))

            # plot with chainconsumer:

            # cc = ChainConsumer()

            # cc.add_chain(fig6data, parameters=["X", "$Z$", "$Q_b$ (MeV)",
            #     "$d$ (kpc)", "$\\xi_b$", "$\\xi_p$"])\
            if savefig:
                self.cc.plotter.plot(
                    parameters=[self.cc_parameters[x] for x in ['X','Z','Qb','d','xi_b','xi_p']],
                    filename=self.run_id+"_fig6.pdf",
                    truth=truths, figsize="page")
            else:
                fig = self.cc.plotter.plot(
                    parameters=[self.cc_parameters[x] for x in ['X','Z','Qb','d','xi_b','xi_p']],
                    truth=truths, figsize="page")
                fig.show()

        # ---------------------------------------------------------------------#
        if ('converge' in options):

            # do the summary plot, comparing the two halves of the burnin

            _cc = ChainConsumer()
            _n = int(np.shape(self.samples)[0]/2)
            _cc.add_chain(self.samples[:_n,:self.ndim],
                parameters=list(self.cc_parameters.keys())[:self.ndim],
                name='{}-{}'.format(self.samples_burnin,
                self.samples_burnin+int(_n/self.nwalkers)))
            _cc.add_chain(self.samples[_n:,:self.ndim],
                parameters=list(self.cc_parameters.keys())[:self.ndim],
                name='{}-{}'.format(self.samples_burnin+int(_n/self.nwalkers),
                self.nsteps_completed))
            if savefig:
                _cc.plotter.plot_summary(
                    filename=self.run_id+"_converge.pdf")#,figsize="page")
            else:
                fig = _cc.plotter.plot_summary()#figsize="page")
                fig.show()

        # ---------------------------------------------------------------------#
        if ('comparison' in options) & (self.models_burnin != burnin):

            # and finally read in the model realisations
            # This loop can take a LOOOOOONG time for long runs

            print ("Reading in and processing blobs, ignoring first {}...".format(burnin))
            blobs = self.reader.get_blobs(flat=True)

            # Get predictions for each model run from the blobs structure:

            time, e_b, alpha, mdot = [], [], [], []
            # X = [] # just for testing; won't be included in future blobs
            for i in range(burnin*self.nwalkers, len(blobs["model"])):
                _model = eval(blobs["model"][i].decode('ASCII', 'replace'))
                time.append(_model['time'])
                e_b.append(_model['e_b'])
                alpha.append(_model['alpha'])
                mdot.append(_model['mdot'])
                # X.append(_model['x_0'][0])
            print ("...done")

            # to get the parameter middle values and uncertainty use the
            # functions get_param_uncert_obs and get_param_uncert_part
            # e.g.

            numbursts_pred = [len(x) for x in time]
            # special here for the base20 run, to 3500 steps at least;
            # more generally want to have a way of doing this on the fly
            # part = ['loX-36' if ((_n == 36) & (self.samples[i,0] < 0.3)) 
            #     else 'loX-37' if ((_n == 37) & (self.samples[i,0] < 0.3)) 
            #     else 'hiX' #if (self.samples[i,0] > 0.3)
            #     for i, _n in enumerate(numbursts_pred)]
            if (part is None): # & (len(set(numbursts_pred)) > 1):
                part = numbursts_pred
            times = get_param_uncert_part(time, partition=part)

            # Here we calculate the parameter uncertainties on the
            # predcted fluences, for comparison with the observations

            # this fails with inhomogeneous arrays; need to do something
            # a bit more complicated
            # fpred = (np.array(e_b).T*self.fluen_fac/np.array(xib)/np.array(distance)**2).T
            fpred = [list(np.array(_e_b)*self.fluen_fac/self.samples[_i,4]/self.samples[_i,3]**2) for _i, _e_b in enumerate(e_b)]
            ebs = get_param_uncert_part(fpred, partition=part)

            alphas = get_param_uncert_part(alpha, partition=part)

	    # store these parameters and flag it so we don't need to
	    # calculate them again (unless burnin changes)

            # part_stats = None
            # if part is not None:
            #     part_stats = {x: len(np.where(np.array(part) == x)[0]) for x in set(part)}
            part_stats = {x: len(np.where(np.array(part) == x)[0]) for x in times.keys()}
            self.model_pred = { 'mdot': mdot,
                'times': time, 'time_stats': times,
                'numbursts': numbursts_pred, 'partition': part,
                'part_stats': part_stats,
                'e_b': e_b, 'e_b_stats': ebs,
                'alpha': alpha, 'alpha_stats': alphas }
            self.models_burnin = burnin

            # Here also we modify the ChainConsumer object if we have
            # multiple models

            if (len(times) != self.cc_nchain) & (part is not None):
                self.cc = ChainConsumer()
                self.cc_nchain = 0
                for _n in set(part):
                    # need to check that there are sufficient samples here
                    _sel = np.array(part) == _n
                    _check = np.shape(self.samples[_sel])[0]
                    if _check > 1000:
                        self.cc.add_chain(self.samples[_sel],
                            # name='{} bursts'.format(_n),
                            name = _n if type(_n) == str else str(_n),
                            parameters=list(self.cc_parameters.values()))
                        self.cc_nchain += 1
                    else:
                      print ('Skipping walkers for n={}, too few samples ({})'.format(_n, _check))
                print ('Updated chain object with {} model classes'.format(self.cc_nchain))

        # ---------------------------------------------------------------------#
        if 'fig8' in options:

            # here we read in data from the anisotropy models. There's
            # probably a better way to do this, via concord (if it's
            # available)

            counts, ybins, xbins, image = plt.hist2d(self.samples[:,5],
                self.samples[:,4], bins=500, norm=LogNorm(), cmap='OrRd')

            xi_p_model2 = np.arange(0, 2.5, 0.01)
            xi_b_model2 = np.empty(len(xi_p_model2))

            for i in range(0,250):

                xi_b_model2[i] = 1./((1./(2*xi_p_model2[i])) + 0.5)

            # overplot the various models

            plt.plot(xi_p_model2, xi_b_model2, color = 'black',ls='-', label = 'Fujimoto (1988)')

            if Beans.HAS_CONCORD:
                # setup dict with list of models, legend labels and linestyles
                he16_models = {'he16_a': ('He \& Keek (2016) model A', '--'),
                               'he16_b': ('model B', '-.'),
                               'he16_c': ('model C', (0, (3, 5, 1, 5))),
                               'he16_d': ('model D', (0, (1, 5))) }

                for model in he16_models.keys():

                    _model = self.cd.diskmodel.load_he16(model)

                    model_theta = _model['col1']
                    model_xid = _model['col2']
                    model_xir = _model['col3']
                    model_xip1 = _model['col4']
                    model_xib1 = model_xid + model_xir

                    model_xib = 1./model_xib1
                    model_xip = 1./model_xip1

                    #modela:
                    plt.plot(model_xip, model_xib, color='darkblue',
                        ls=he16_models[model][1], label=he16_models[model][0])

            else:
                print ('''
** WARNING ** install concord if you want to overplot model curves
              See https://github.com/outs1der/concord''')

            plt.xlabel(r'$\xi_{\mathrm{p}}$',fontsize='xx-large')
            plt.ylabel(r'$\xi_{\mathrm{b}}$',fontsize='xx-large')

            plt.legend(loc='best',fontsize='large')

            plt.axis([0.,2.1,0.,2.1])

            plt.xticks(fontsize=14)
            plt.yticks(fontsize=14)

            if savefig:
                plt.savefig('{}_xipvsxib_models_contourlines.pdf'.format(self.run_id))
            else:
                plt.show()

        # ---------------------------------------------------------------------#
        if 'comparison' in options:

            # make plot of observed burst comparison with predicted bursts:

            plt.figure(figsize=(10,7))

            # copy colors from plot method for consistency

            bursts_colour = 'tab:blue'
            obs_colour = 'tab:grey'

            # plt.scatter(self.bstart, self.fluen, color = 'black', marker = '.', label='Observed', s =200)
            if self.train:
                # 2-panel plot like in plot

                fig, axs = plt.subplot_mosaic([['main'],['main'],['resid']], sharex=True)
                ax1 = axs['main']

                ax1.errorbar(self.bstart[self.ifluen], self.fluen[self.ifluen],
                    yerr=self.fluene[self.ifluen],
                    color=obs_colour, linestyle='', marker='.', ms=13,
                    label='observed')
                # non-redundant option for missing fluence values
                for i in range(self.numburstsobs):
                    if (i not in self.ifluen) & (i != self.ref_ind):
                        ax1.axvline(self.bstart[i], color=obs_colour, ls='--')
                ax1.axvline(self.bstart[self.ref_ind], c='k', ls='--')

                if self.gti_checking:
                    #plot satellite gtis
                    for i in range(1,len(self.st)):
                        ax1.axvspan(self.st[i],self.et[i],facecolor='0.5', alpha=0.2)
                    ax1.axvspan(self.st[0],self.et[0], facecolor='0.5',alpha=0.2,label='Satellite GTIs')

                times = self.model_pred['time_stats']
                ebs = self.model_pred['e_b_stats']
                # loop over all the different solutions
                _label = 'matched'
                for i, numburstssim in enumerate(times.keys()):
                    # print (i, numburstssim, times, ebs)
                    timepred = [x[0] for x in times[numburstssim]]
                    timepred_errup = [x[1] for x in times[numburstssim]]
                    timepred_errlow = [x[2] for x in times[numburstssim]]
                    ebpred = [x[0] for x in ebs[numburstssim]]
                    ebpred_errup = [x[1] for x in ebs[numburstssim]]
                    ebpred_errlow = [x[2] for x in ebs[numburstssim]]
                    ax1.errorbar(timepred[1:], ebpred,
                        yerr=[ebpred_errup, ebpred_errlow],
                        # xerr=[timepred_errup[1:], timepred_errlow[1:]],
                        marker='*', ms=11, linestyle='', color='C{}'.format(i),
                        label='predicted ({})'.format(numburstssim))

                    ref_tpred = np.argmin(np.abs(self.bstart[self.ref_ind]-timepred))
                    imatch = burst_time_match(self.ref_ind, self.bstart,
                        ref_tpred, np.array(timepred))
                    print (numburstssim, imatch)
                    # Not sure this will work so well if there are
                    # multiple sets of solutions
                    # if len(times.keys()) == 1:
                    imatchm1 = [x-1 for x in imatch if x-1 >= 0]
                    ax1.plot(np.array(timepred[1:])[imatchm1], 
                        np.array(ebpred)[imatchm1],
                        marker='*', ms=5, linestyle='', color='tab:red',
                        label=_label,zorder=99)
                    _label = None # only give the label the first time

                    resid = -(self.bstart-np.array(timepred)[imatch])*24.
                    axs['resid'].errorbar(self.bstart, resid,
                        yerr=[np.array(timepred_errup)[imatch]*24.,
                        np.array(timepred_errlow)[imatch]*24.],
                        marker='*', ms=11, linestyle='', color='C{}'.format(i))
                    print ('RMS obs-model offset ({}, {:.2f}%) = {:.4f} hr'.format(
                        numburstssim, 100.*self.model_pred['part_stats'][numburstssim]/len(self.samples), 
                        np.sqrt(np.mean(resid**2))))

                ax1.set_ylabel("Fluence ($10^{-6}\\,{\\rm erg\\,cm^{-2}}$)")
                axs['resid'].axhline(0.0, color=obs_colour, ls='--')
                axs['resid'].set_ylabel('Time offset (hr)')
                axs['resid'].set_xlabel("Time (days after MJD {})".format(self.tref))
                ax1.legend(loc=2)

            else:
                # different style plot for the ensemble mode; the bstart
                # still records the burst time (epoch) but now we prefer
                # to plot vs. recurrence time
                timepred = [x[0] for x in times]
                timepred_errup = [x[1] for x in times]
                timepred_errlow = [x[2] for x in times]
                ebpred = [x[0] for x in ebs]
                ebpred_errup = [x[1] for x in ebs]
                ebpred_errlow = [x[2] for x in ebs]
                plt.errorbar(self.tdel, self.fluen, yerr=self.fluene,
                    color='black', linestyle='', marker='.', ms=13, label='Observed')
                plt.scatter(timepred, ebpred, marker='*', color=bursts_colour, s=100, label='Predicted')
                plt.errorbar(timepred, ebpred,
                    yerr=[ebpred_errup, ebpred_errlow],
                    xerr=[timepred_errup, timepred_errlow], fmt='.',
                    color=bursts_colour)
                plt.xlabel("Recurrence time (hr)")

                plt.ylabel("Fluence ($10^{-6}\\,{\\rm erg\\,cm^{-2}}$)")
                plt.legend(loc=2)

            if savefig:
                print ('Saving burst comparison plot to {}_predictedburstscomparison.pdf'.format(self.run_id))
                fig.savefig(f'{self.run_id}_predictedburstscomparison.pdf')
            else:
                print ('Skipping burst comparison plot save')
            fig.show()

    def prune(self, key=None, nwalkers=None, scale=0.0, savefile=None):
        '''
        This method will "prune" the walkers to keep only one set of
        solutions. It is necessary that :meth:`Beans.do_analysis` has
        already been called, with the `comparison` option, to identify the
        model classes.

        The method will return the new set of positions, and optionally
        save them to a pickle file

        :param key: model class to keep, usually labeled by the number of predicted bursts
        :param nwalkers: number of samples to generate, if not the current number of walkers
        :param scale: in case it's necessary to distribute the walker positions around the seed values, this parameter sets the Gaussian scale
        :param savefile: name of pickle file to save to

        :returns: array of walker positions, dimensions (nwalkers, ndim)
        '''

        if not hasattr(self, 'model_pred'):
            print ('** ERROR ** no model predictions available, run the comparison first')
            return None

        if key is None:
            print ("** ERROR ** no key supplied, don't know which set to keep")
            return None

        if not (key in set(self.model_pred['partition'])):
            print ("** ERROR ** key not present in model prediction set: {}".format(set(self.model_pred['partition'])))
            return None

        new_pos, d1, d2, d3 = self.reader.get_last_sample()

        # now redistribute the "bad" walkers

        bad = np.array(self.model_pred['partition'])[-self.nwalkers:] != key

        print ('Redistributing {} of {} walkers...'.format(len(np.where(bad)[0]), self.nwalkers))

        for i in (np.where(bad)[0]):
            new_pos[i] = new_pos[np.random.choice(np.where(~bad)[0])] + scale*np.random.randn(self.ndim)

        if savefile is not None:
            print ('Saving positions to {}'.format(savefile))
            pickle.dump(new_pos, open(savefile, 'wb'))

        return new_pos


# end of beans.py