Source code for radvel.prior

from __future__ import annotations

import warnings
from typing import Callable

import numpy as np
from scipy.stats import gaussian_kde, norm

from radvel import model
from radvel import orbit
from radvel import utils


class Prior(object):

    # By default, priors are not extra constraints.
    # They should specify if they are.
    # Relevant only for nested sampling.
    extra_constraint: bool = False

    def __repr__(self) -> str:
        return "Generic Prior"



[docs]
class Gaussian(Prior):
    """Gaussian prior

    Guassian prior on a given parameter.

    Args:
        param (string): parameter label
        mu (float): center of Gaussian prior
        sigma (float): width of Gaussian prior
    """

    def __init__(self, param: str, mu: float, sigma: float):
        self.mu = mu
        self.sigma = sigma
        self.param = param

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = vector.vector[vector.indices[self.param]][0]
        return -0.5 * ((x - self.mu) / self.sigma)**2 - 0.5*np.log((self.sigma**2)*2.*np.pi)

    def transform(self, u: float) -> float:
        return norm.ppf(u, loc=self.mu, scale=self.sigma)

    def __repr__(self) -> str:
        s = "Gaussian prior on {}, mu={}, sigma={}".format(
            self.param, self.mu, self.sigma
            )
        return s

    def __str__(self) -> str:
        try:
            tex = model.Parameters(9).tex_labels(param_list=[self.param])[self.param]

            s = "Gaussian prior on {}: ${} \\pm {}$ \\\\".format(tex, self.mu, self.sigma)
        except KeyError:
            s = self.__repr__()

        return s




[docs]
class EccentricityPrior(Prior):
    """Physical eccentricities

    Prior to keep eccentricity between 0 and a specified upper limit.

    Args:
        num_planets (int or list): Planets to apply the eccentricity prior.
            If an integer is given then all planets with indexes up to and including
            the specified integer will be included in the prior. If a list is given then
            the prior will only be applied to the specified planets.
        upperlims (float or list of floats): List of eccentricity upper limits to assign
            to each of the planets. If a float is given then all planets must have
            eccentricities less than this value. If a list of floats is given then
            each planet can have a different eccentricity upper limit.
    """

    extra_constraint: bool = True

    def __repr__(self) -> str:
        msg = ""
        for i, num_planet in enumerate(self.planet_list):
            msg += "e{} constrained to be < {}\n".format(num_planet, self.upperlims[i])

        return msg[:-1]

    def __str__(self) -> str:
        tex = model.Parameters(9, basis='per tc e w k').tex_labels()

        msg = ""
        for i, num_planet in enumerate(self.planet_list):
            par = "e{}".format(num_planet)
            label = tex[par]
            msg += "{} constrained to be $<{}$ \\\\\\\\\n".format(label, self.upperlims[i])

        return msg[:-5]

    def __init__(self, num_planets: int | list[int], upperlims: float = 0.99) -> None:

        if type(num_planets) == int:
            self.planet_list = range(1, num_planets+1)
            npl = num_planets
        else:
            self.planet_list = num_planets
            npl = len(self.planet_list)

        if type(upperlims) == float:
            self.upperlims = [upperlims] * npl
        else:
            assert len(upperlims) == len(self.planet_list), "Number of eccentricity \
upper limits must match number of planets."
            self.upperlims = upperlims

    def __call__(self, params: model.Parameters, vector: model.Vector, finite: bool = False) -> float:
        def _getpar(key: str, num_planet: int) -> float:
            return vector.vector[vector.indices['{}{}'.format(key, num_planet)]][0]

        parnames = params.basis.name.split()

        for i, num_planet in enumerate(self.planet_list):
            if 'e' in parnames:
                ecc = _getpar('e', num_planet)
            elif 'secosw' in parnames:
                secosw = _getpar('secosw', num_planet)
                sesinw = _getpar('sesinw', num_planet)
                ecc = secosw**2 + sesinw**2
            elif 'ecosw' in parnames:
                ecosw = _getpar('ecosw', num_planet)
                esinw = _getpar('esinw', num_planet)
                ecc = np.sqrt(ecosw**2 + esinw**2)
            elif 'se' in parnames:
                secc = _getpar('se',num_planet)
                ecc = secc**2

            if ecc > self.upperlims[i] or ecc < 0.0:
                return -np.inf if not finite else -1e100

        return -np.sum(np.log(self.upperlims))

    def transform(self, u: float | np.ndarray) -> None:
        raise NotImplementedError(
            "EccentricityPrior places an extra_constraint on existing parameters. "
            "It will be called by 'extra_likelihood' and not as a prior transform. "
            "If your basis uses eccentricity directly and your only constraint is U(0, 1), use HardBounds."
        )




[docs]
class PositiveKPrior(Prior):
    """K must be positive

    A prior to prevent K going negative.
    Be careful with this as it can introduce a bias to larger K
    values.

    Args:
        num_planets (int): Number of planets. Used to ensure K for each
            planet is positive
    """

    extra_constraint = True

    def __repr__(self) -> str:
        return "K constrained to be > 0"

    def __str__(self) -> str:
        return "$K$ constrained to be $>0$"

    def __init__(self, num_planets: int) -> None:
        self.num_planets = num_planets

    def __call__(self, params: model.Parameters, vector: model.Vector, finite: bool = False) -> float:
        def _getpar(key: str, num_planet: int) -> float:
            return vector.vector[vector.indices['{}{}'.format(key, num_planet)]][0]

        for num_planet in range(1, self.num_planets+1):
            try:
                k = _getpar('k', num_planet)
            except KeyError:
                k = np.exp(_getpar('logk', num_planet))

            if k < 0.0:
                return -np.inf if not finite else -1e100
        return 0

    def transform(self, u: float | np.ndarray) -> None:
        raise NotImplementedError(
            "PositiveKPrior places an extra_constraint on existing parameters. "
            "It will be called by 'extra_likelihood' and not as a prior transform. "
            "If your only constraint for K is (0, 1), use HardBounds (or a log-scale prior)"
        )




[docs]
class HardBounds(Prior):
    """Prior for hard boundaries

    This prior allows for hard boundaries to be established
    for a given parameter.

    Args:
        param (string): parameter label
        minval (float): minimum allowed value
        maxval (float): maximum allowed value
    """

    def __init__(self, param: str, minval: float, maxval: float) -> None:
        self.minval = minval
        self.maxval = maxval
        self.param = param

        self.finite = True

        if not np.isfinite(self.minval) or not np.isfinite(self.maxval):
            warnings.warn("Non-finite boundary given to HardBounds. Your likelihood will not be properly normalized.",
                          UserWarning)
            self.finite = False

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = vector.vector[vector.indices[self.param]][0]
        if x <= self.minval or x >= self.maxval:
            return -np.inf
        else:
            if self.finite:
                return -np.log(self.maxval-self.minval)
            else:
                return 0

    def transform(self, u: float | np.ndarray) -> float | np.ndarray:
        if not self.finite:
            raise ValueError("Prior transform for HardBounds requires finite boundaries")
        return self.minval + u * (self.maxval - self.minval)

    def __repr__(self) -> str:
        s = "Bounded prior on {}, min={}, max={}".format(
            self.param, self.minval, self.maxval
            )
        return s

    def __str__(self) -> str:
        try:
            tex = model.Parameters(9).tex_labels(param_list=[self.param])[self.param]

            s = "Bounded prior: ${} < {} < {}$".format(self.minval,
                                                       tex.replace('$', ''),
                                                       self.maxval)
        except KeyError:
            s = self.__repr__()

        return s




[docs]
class SecondaryEclipsePrior(Prior):
    """Secondary eclipse prior

    Implied prior on eccentricity and omega by specifying measured secondary eclipse time

    Args:
        planet_num (int): Number of planet with measured secondary eclipse
        ts (float): Secondary eclipse midpoint time.
            Should be in the same units as the timestamps of your data.
        ts_err (float): Uncertainty on secondary eclipse time
    """

    extra_constraint = True

    def __repr__(self) -> str:
        msg = ""
        msg += "secondary eclipse constraint: {} +/- {}\n".format(self.ts, self.ts_err)

        return msg[:-1]

    def __str__(self) -> str:
        msg = "secondary eclipse prior: ${} \\pm {}$ \\\\\\\\\n".format(self.ts, self.ts_err)

        return msg[:-5]

    def __init__(self, planet_num: int, ts: float, ts_err: float) -> None:

        self.planet_num = planet_num
        self.ts = ts
        self.ts_err = ts_err

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        def _getpar(key):
            return synth_params[vector.indices['{}{}'.format(key, self.planet_num)]][0]

        synth_params = vector.params.basis.v_to_synth(vector)

        tp = synth_params[-4+(5*self.planet_num)][0]
        per = synth_params[-5+(5*self.planet_num)][0]
        ecc = synth_params[-3+(5*self.planet_num)][0]
        omega = synth_params[-2+(5*self.planet_num)][0]

        ts = orbit.timeperi_to_timetrans(tp, per, ecc, omega, secondary=True)
        ts_phase = utils.t_to_phase_vector(vector, ts, self.planet_num)

        pts = utils.t_to_phase_vector(vector, self.ts, self.planet_num)
        epts = self.ts_err / per

        penalty = -0.5 * ((ts_phase - pts) / epts)**2 - 0.5*np.log((epts**2)*2.*np.pi)

        return penalty

    def transform(self, u: float | np.ndarray) -> None:
        raise NotImplementedError(
            "SecondaryEclipsePrior places an extra_constraint on existing parameters. "
            "It will be called by 'extra_likelihood' and not as a prior transform. "
            "If your only constraint for K is (0, 1), use HardBounds (or a log-scale prior)"
        )




[docs]
class Jeffreys(Prior):
    """Jeffrey's prior

    This prior follows the distribution:

    .. math::
        p(x) \\propto \\frac{1}{x}

    with upper and lower bounds to prevent singularity at :math:`x=0`.

    Args:
        param (string): parameter label
        minval (float): minimum allowed value
        maxval (float): maximum allowed value
    """

    def __init__(self, param: str, minval: float, maxval: float) -> None:
        self.minval = minval
        self.maxval = maxval
        self.param = param

        self.normalization = 1./np.log(self.maxval/self.minval)

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = vector.vector[vector.indices[self.param]][0]
        if x < self.minval or x > self.maxval:
            return -np.inf
        else:
            return np.log(self.normalization) - np.log(x)

    def transform(self, u: float | np.ndarray) -> float | np.ndarray:
        return self.minval * np.exp(u * np.log(self.maxval / self.minval))

    def __repr__(self) -> str:
        s = "Jeffrey's prior on {}, min={}, max={}".format(
            self.param, self.minval, self.maxval
            )
        return s
    def __str__(self) -> str:
        try:
            tex = model.Parameters(9).tex_labels(param_list=[self.param])[self.param]

            s = "Jeffrey's prior: ${} < {} < {}$".format(self.minval,
                                                       tex.replace('$',''),
                                                       self.maxval)
        except KeyError:
            s = self.__repr__()

        return s




[docs]
class ModifiedJeffreys(Prior):
    """Modified Jeffry's prior

    This prior follows the distribution:

    .. math::
        p(x) \\propto \\frac{1}{x-x_0}

    with upper bound.

    Args:
        param (string): parameter label
        kneeval (float): "knee" of Jeffrey's prior (:math:`x_0` in eq above)
        minval (float): minimum allowed value. `minval` must be larger than `kneeval`
        maxval (float): maximum allowed value

    """

    def __init__(self, param: str, minval: float, maxval: float, kneeval: float) -> None:
        self.maxval = maxval
        self.param = param
        self.kneeval = kneeval
        self.minval = minval

        self.normalization = 1./np.log((self.maxval-self.kneeval)/(self.minval-self.kneeval))

        assert self.minval > self.kneeval, "ModifiedJeffreys prior requires minval>kneeval."

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = vector.vector[vector.indices[self.param]][0]
        if (x > self.maxval) or (x < self.minval):
            return -np.inf
        else:
            return np.log(self.normalization) - np.log(x-self.kneeval)

    def transform(self, u: float | np.ndarray) -> float | np.ndarray:
        return self.kneeval + (self.minval - self.kneeval) * np.exp(u / self.normalization)

    def __repr__(self) -> str:
        s = "Modified Jeffrey's prior on {}, knee={}, min={}, max={}".format(
            self.param, self.kneeval, self.minval, self.maxval
            )
        return s
    def __str__(self) -> str:
        try:
            tex = model.Parameters(9).tex_labels(param_list=[self.param])[self.param]

            s = "Modified Jeffrey's prior: knee = {}; ${} < {} < {}$".format(
                self.kneeval, self.minval, tex.replace('$',''), self.maxval
                )
        except KeyError:
            s = self.__repr__()

        return s



[docs]
class NumericalPrior(Prior):
    """Prior defined by an input array of values

    Wrapper for scipy.stats.gaussian_kde.

    This prior uses Gaussian Kernel Density Estimation to
    estimate the probability density function from which
    a set of values are randomly drawn.

    Useful for defining a prior given a posterior obtained
    from a complementary fitting process. For example, you
    might use transit data to obtain constraints on secosw and
    sesinw, then use the posterior on secosw as a prior for
    a RadVel fit.

    Args:
        param_list (list of str): list of parameter label(s).
        values (numpy array of float): values of ``param`` you
            wish to use to define this prior. For example, this
            might be a posterior array of values of secosw
            derived from transit data. In case of univariate data
            this is a 1-D array, otherwise a 2-D array with shape
            (# of elements in param_list, # of data points).
        bw_method (str, scalar, or callable [optional]): see
            scipy.stats.gaussian_kde
        bins (int [optional]): number of bins for the histogram when creating
            nested sampling prior transform. Defaults to 100.

    Note: the larger the input array of values, the longer it will
    take for calls to this prior to be evaluated. Consider thinning
    large input arrays to speed up performance.

    """

    def __init__(self, param_list: list[str], values: np.ndarray, bw_method: str | float | None = None, bins: int | str = 'auto') -> None:
        self.param_list = param_list
        self.pdf_estimate = gaussian_kde(values, bw_method=bw_method)
        # Ref (and source code) for the histogram: https://johannesbuchner.github.io/UltraNest/priors.html#Non-analytic-priors
        hist, bin_edges = np.histogram(values, bins=bins)
        self.hist_cumulative = np.cumsum(hist / hist.sum())
        self.bin_middle = (bin_edges[:-1] + bin_edges[1:]) / 2

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = []
        for param in self.param_list:
            x.append(vector.vector[vector.indices[param]][0])
        val = np.log(self.pdf_estimate(x))
        return val[0]

    def transform(self, u: float | np.ndarray) -> float | np.ndarray:
        return np.interp(u, self.hist_cumulative, self.bin_middle)

    def __repr__(self) -> str:
        s = "Numerical prior on {}".format(
            self.param_list
            )
        return s

    def __str__(self) -> str:
        try:
            tex = model.Parameters(9).tex_labels(param_list=self.param_list)
            t=[tex[key] for key in tex.keys()]
            if len(self.param_list) == 1:
                str2print = '{0}'.format(*t)
            elif len(self.param_list) == 2:
                str2print = '{} and {}'.format(*t)
            else:
                str2print = ''
                for el in np.arange(len(self.param_list) - 1):
                    str2print += '{}, '.format(t[el])
                str2print += 'and {}'.format(t[el+1])
            s = "Numerical prior on " + str2print + \
                ", defined using Gaussian kernel density estimation."
        except KeyError:
            s = self.__repr__()

        return s




[docs]
class UserDefinedPrior(Prior):
    """Interface for user to define a prior
       with an arbitrary functional form.

    Args:
        param_list (list of str): list of parameter label(s).
        func (function): a Python function that takes in  a list
            of values (ordered as in ``param_list``), and returns
            the corresponding log-value of a pdf.
        tex_rep (str): TeX-readable string representation of
            this prior, to be passed into radvel report and
            plotting code.
        transform_func (function): a Python function that takes a unit cube
            with dimension equal to the number of parameters in
            param_list, and returns samples from the prior.
            This is usually the inverse-cdf of func.
            Set to None by default. In that case the prior cannot
            be used for Nested Sampling.

    Example:
        >>> def myPriorFunc(inp_list):
        ...     if inp_list[0] > 0. and inp_list[0] < 1.:
        ...         return 0.
        ...     else:
        ...         return -np.inf
        >>> myTexString = 'Uniform Prior on $\\sqrt{e}$'
        >>> myPrior = radvel.prior.UserDefinedPrior(['se'], myPriorFunc, myTexString)

    Note:
        ``func`` must be properly normalized; i.e. integrating over the
        entire parameter space must give a probability of 1.
    """

    def __init__(self, param_list: list[str], func: Callable, tex_rep: str, transform_func: Callable | None = None) -> None:
        self.param_list = param_list
        self.func = func
        self.transform_func = transform_func
        self.tex_rep = tex_rep

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:
        x = []
        for param in self.param_list:
            x.append(vector.vector[vector.indices[param]][0])
        return self.func(x)

    def transform(self, u: float | np.ndarray) -> float | np.ndarray:
        if self.transform_func is None:
            raise TypeError("transform_func is None. Set it to a function before calling transform().")
        return self.transform_func(u)

    def __repr__(self) -> str:
        s = "User-defined prior on {}".format(
            self.param_list
            )
        return s

    def __str__(self) -> str:
        s = self.tex_rep
        return s




[docs]
class InformativeBaselinePrior(Prior):
    """ Informative baseline prior suggested
    by A. Vanderburg (see Blunt et al. 2019).

    This prior follows the distribution:

    .. math::
        p(x) \\propto 1\\, \\mathrm{{if}}\\, x-t_{{d}} \\lt B

             \\propto (B+t_{{d}})/x\\, \\mathrm{{else}}

    with upper bound.

    Args:
        param (string): parameter label
        baseline (float): :math:`B` in eq above
        duration (float): :math:`t_{{d}}` in eq above (default: 0.0)

    """

    def __init__(self, param: str, baseline: float, duration: float = 0.0) -> None:
        self.param = param
        self.baseline = baseline
        self.duration = duration

    def __repr__(self) -> str:
        s = "Informative baseline prior on {}, baseline={}, duration={}".format(
            self.param, self.baseline, self.duration
            )
        return s

    def __call__(self, params: model.Parameters, vector: model.Vector) -> float:

        per = vector.vector[vector.indices[self.param]][0]

        if self.param.startswith('logper'):
            per = np.exp(per)

        if (per-self.duration)<=self.baseline:
            return 0.
        else:
            return np.log((self.baseline+self.duration)/per)

    def transform(self, u: float | np.ndarray) -> None:
        # TODO: Implement for this distribution
        raise NotImplementedError("Prior transform not yet implemented InformativeBaselinePrior")