Source code for measure_extinction.model

import copy
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.ticker import ScalarFormatter
import astropy.units as u
from astropy.table import QTable
import scipy.optimize as op

import emcee
import corner
from multiprocessing import Pool

from dust_extinction.parameter_averages import G23
from dust_extinction.shapes import _curve_F99_method


__all__ = ["MEParameter", "MEModel"]


# required to be outside of the class to allow for emcee to be able to run in parallel
def _lnprob(params, memodel, *args):
    """
    Evaluate the log-probability of a model for a given set of fit parameters.

    Parameters
    ----------
    params : np array
        values of the non-fixed parameters
    memodel : MEModel object
        model that is updated in place with ``params``
    *args
        passed unchanged to ``memodel.lnprob``

    Returns
    -------
    lnp : float
        value returned by ``memodel.lnprob(*args)``
    """
    # push the proposed values into the model before evaluating it
    memodel.fit_to_parameters(params)
    log_probability = memodel.lnprob(*args)
    return log_probability



[docs]
class MEParameter(object):
    """
    Provide parameter info in a flexible format.
    Inspired by astropy modeling.

    Parameters
    ----------
    value : float
        current value of the parameter [default=0.0]

    unc : float or None
        uncertainty on the value [default=None]

    bounds : 2 element sequence
        (min, max) allowed values, None means no limit on that side

    prior : 2 element sequence or None
        (mean, sigma) of a Gaussian prior, None means no prior

    fixed : boolean
        flag marking the parameter as fixed [default=False]
    """

    def __init__(
        self, value=0.0, unc=None, bounds=(None, None), prior=None, fixed=False
    ):
        self.value = value
        self.unc = unc
        # square bounds are supported by giving (min, max) as the bounds
        self.bounds = bounds
        # currently only Gaussian priors are supported by giving (mean, sigma) as the prior
        self.prior = prior
        self.fixed = fixed

    def __repr__(self):
        # readable representation, useful when debugging a model's parameters
        return (
            f"{type(self).__name__}(value={self.value!r}, unc={self.unc!r}, "
            f"bounds={self.bounds!r}, prior={self.prior!r}, fixed={self.fixed!r})"
        )




[docs]
class MEModel(object):
    """
    Model object for the measure_extinction fitting.  Includes all parameters and
    useful functions.
    Inspired by astropy modeling.

    The parameters are MEParameter objects defined as class attributes; their
    names are listed, in order, in `paramnames`.
    """

    # order of the parameters in the vectors exchanged with the fitters/samplers
    # fmt: off
    paramnames = ["logTeff", "logg", "logZ", "vturb", "velocity", "windamp", "windalpha",
                  "Av", "Rv", "C2", "B3", "C4", "xo", "gamma",
                  "vel_MW", "logHI_MW", "fore_Av", "fore_Rv", "vel_exgal", "logHI_exgal",
                  "norm"]
    # fmt: on

    # stellar
    logTeff = MEParameter(value=4.0, bounds=(0.0, 10.0))
    logg = MEParameter(value=3.0, bounds=(0.0, 10.0))
    logZ = MEParameter(value=0.0, bounds=(-1.0, 1.0))
    vturb = MEParameter(value=5.0, bounds=(2.0, 10.0))
    velocity = MEParameter(value=0.0, bounds=[-1000.0, 1000.0], fixed=True)  # km/s
    windamp = MEParameter(value=0.0, bounds=(0.0, 1.0), fixed=True)
    windalpha = MEParameter(value=2.0, bounds=(0.5, 3.5), fixed=True)

    # dust - values, bounds, and priors based on VCG04 and FM07 MW samples (except Av)
    Av = MEParameter(value=1.0, bounds=(0.0, 100.0))
    Rv = MEParameter(value=3.0, bounds=(2.3, 5.6), prior=(3.0, 0.4))
    C2 = MEParameter(value=0.73, bounds=(-0.1, 5.0), prior=(0.73, 0.25))
    B3 = MEParameter(value=3.6, bounds=(-1.0, 8.0), prior=(3.6, 0.6))
    C4 = MEParameter(value=0.4, bounds=(-0.5, 1.5), prior=(0.4, 0.2))
    xo = MEParameter(value=4.59, bounds=(4.5, 4.9), prior=(4.59, 0.02))
    gamma = MEParameter(value=0.89, bounds=(0.6, 1.7), prior=(0.89, 0.08))

    # gas
    vel_MW = MEParameter(value=0.0, bounds=(-300.0, 300.0))  # km/s
    logHI_MW = MEParameter(value=20.0, bounds=(16.0, 24.0))
    vel_exgal = MEParameter(value=0.0, bounds=(-300.0, 1000.0), fixed=True)  # km/s
    logHI_exgal = MEParameter(value=16.0, bounds=(16.0, 24.0), fixed=True)

    # foreground MW dust parameters (when used, set based on HI and parameters fixed)
    # used to account for MW foreground dust extinction when measuring extinction
    # in external galaxies
    fore_Av = MEParameter(value=0.0, bounds=(0.0, 10.0), fixed=True)
    fore_Rv = MEParameter(value=3.1, bounds=(2.3, 5.6), prior=(3.0, 0.4), fixed=True)
    # set to True if sampling (e.g., MCMC) to enable sampling the foreground prior
    fore_sampling = False
    # random number generator needed for fore_sampling (fixed seed)
    rng = np.random.default_rng(123456)

    # normalization value (puts model at the same level as data)
    #   value depends on the stellar radius and distance
    #   radius would require adding stellar evolutionary track info
    norm = MEParameter(value=1.0)

    # full FM90+optnir fitting (default) or G23 for the full wavelength range
    g23_all_ext = False

    #  bad regions are defined as those where we know the models do not work
    #  or the data is bad; each row is [min, max] in 1/micron
    exclude_regions = [
        [8.23 - 0.05, 8.23 + 0.05],  # geocoronal line
        [8.7, 10.0],  # bad data from STIS
        [3.55, 3.6],
        [3.80, 3.90],
        [4.15, 4.3],
        [6.4, 6.6],
        [7.1, 7.3],
        [7.45, 7.55],
        [7.65, 7.75],
        [7.9, 7.95],
        [8.05, 8.1],
    ] / u.micron

    # value returned by lnprior when a parameter is outside its bounds
    # some fitters don't like inf, can be changed here
    lnp_bignum = -np.inf

    def __init__(self, modinfo=None, obsdata=None, logf=False):
        """
        Initialize the object, optionally using the min/max of the input model info
        to set the value and bounds on the stellar parameters

        Parameters
        ----------
        modinfo : ModelData object
            all the information about the model spectra

        obsdata : StarData object
            observed data for a reddened star
        """
        if modinfo is not None:
            self.logTeff.bounds = (modinfo.temps_min, modinfo.temps_max)
            self.logTeff.value = np.average(self.logTeff.bounds)
            self.logg.bounds = (modinfo.gravs_min, modinfo.gravs_max)
            self.logg.value = np.average(self.logg.bounds)
            self.logZ.bounds = (modinfo.mets_min, modinfo.mets_max)
            self.logZ.value = np.average(self.logZ.bounds)
            self.vturb.bounds = (modinfo.vturb_min, modinfo.vturb_max)
            self.vturb.value = np.average(self.vturb.bounds)

        # setup the mapping between the observed data and model bands
        self.obsdata_bands = None
        self.obsdata_gvals = None
        if obsdata is not None:
            if "BAND" in obsdata.data.keys():
                obsbands = obsdata.data["BAND"].get_band_names()
                obsbands_gvals = [
                    True if cband in obsbands else False for cband in modinfo.band_names
                ]
                if np.sum(obsbands_gvals) != len(obsbands):
                    print("Model: ", modinfo.band_names)
                    print("  Obs: ", obsbands)
                    raise Exception("Model bands do not include all the observed bands")
                self.obsdata_bands = obsbands
                self.obsdata_gvals = obsbands_gvals

        # setup the fractional underestimation values for each type of data
        #    fittable parameter to handle underestimating uncertainties
        if (obsdata is not None) and logf:
            self.logf = {}
            for cspec in obsdata.data.keys():
                self.logf[cspec] = MEParameter(value=-3.0, bounds=(-9.0, 9.0))


[docs]
    def pprint_parameters(self):
        """
        Print the parameter values followed by the parameter names, one line
        per group of parameters.  A value is followed by "F" if the parameter
        is fixed and by "P" if it has a prior.  If the model has logf parameters,
        they are printed on an extra line.
        """
        groups = (
            ("logTeff", "logg", "logZ", "vturb", "velocity", "windamp", "windalpha"),
            ("Av", "Rv", "C2", "B3", "C4", "xo", "gamma"),
            ("vel_MW", "logHI_MW", "fore_Av", "fore_Rv", "vel_exgal", "logHI_exgal"),
        )
        for group in groups:
            entries = []
            for pname in group:
                param = getattr(self, pname)
                flags = "F" if param.fixed else ""
                if param.prior is not None:
                    flags += "P"
                entries.append(f"{param.value:.3f}{flags}")
            print(f"{' '.join(entries)} ({' '.join(group)})")

        if hasattr(self, "logf"):
            # built with a trailing space that is then removed
            labels = "logf: " + "".join(f"{key} " for key in self.logf.keys())
            numbers = "".join(f"{par.value:.2f} " for par in self.logf.values())
            print(f"{numbers[:-1]} ({labels[:-1]})")



[docs]
    def parameters(self):
        """
        Give the values of all the parameters (fixed or not) in a vector.
        The order follows paramnames, with the logf values (if any) at the end.

        Returns
        -------
        params : np array
            parameters values
        """
        values = [getattr(self, pname).value for pname in self.paramnames]
        if hasattr(self, "logf"):
            values.extend(par.value for par in self.logf.values())
        return np.array(values)



[docs]
    def save_parameters(self, filename=None):
        """
        Save the parameters and uncertainties to a table.  Include if they were
        fixed and their priors.  If the model has logf parameters, they are
        included as extra rows named "logf[key]".

        Parameters
        ----------
        filename : str
            name of the file for the saved info, nothing is written if None

        Returns
        -------
        otab : astropy table
            table giving the results, often output with the computed extinction curve
        """
        # collect every parameter (including logf) so that all the table columns
        # have the same length
        names = list(self.paramnames)
        params = [getattr(self, cname) for cname in self.paramnames]
        if hasattr(self, "logf"):
            for ckey, cparam in self.logf.items():
                names.append(f"logf[{ckey}]")
                params.append(cparam)

        nparams = len(params)
        paramvals = np.array([param.value for param in params])
        paramuncs = np.zeros(nparams)
        paramfixed = np.zeros(nparams)
        paramprior = np.zeros(nparams)
        paramprior_val = np.zeros(nparams)
        paramprior_unc = np.zeros(nparams)
        for k, param in enumerate(params):
            # zeros are kept when there is no uncertainty/prior
            if param.unc is not None:
                paramuncs[k] = param.unc
            if param.fixed:
                paramfixed[k] = 1.0
            if param.prior is not None:
                paramprior[k] = 1
                paramprior_val[k] = param.prior[0]
                paramprior_unc[k] = param.prior[1]

        otab = QTable()
        otab["name"] = names
        otab["value"] = paramvals
        otab["unc"] = paramuncs
        otab["fixed"] = paramfixed
        otab["prior"] = paramprior
        otab["prior_val"] = paramprior_val
        otab["prior_unc"] = paramprior_unc
        if filename is not None:
            otab.write(filename, overwrite=True)

        return otab



[docs]
    def parameters_to_fit(self):
        """
        Give the values of the non-fixed parameters in a vector.  Needed for
        most fitters/samplers.  The logf values (if any) are always appended,
        their fixed flag is not checked.

        Returns
        -------
        params : np array
            non-fixed parameters values
        """
        free_values = [
            par.value
            for par in (getattr(self, pname) for pname in self.paramnames)
            if not par.fixed
        ]
        if hasattr(self, "logf"):
            free_values += [par.value for par in self.logf.values()]
        return np.array(free_values)



[docs]
    def fit_to_parameters(self, fit_params, uncs=None):
        """
        Set the parameter values based on a vector of the non-fixed values.
        Needed for most fitters/samplers.  The expected order is the one given
        by parameters_to_fit: non-fixed parameters in paramnames order followed
        by the logf values (if any).

        Parameters
        ----------
        fit_params : np array
            non-fixed parameters values

        uncs : np array
            uncertainties on the non-fixed parameters (same order as fit_params),
            uncertainties are left unchanged if None [default=None]
        """
        free_params = [
            cparam
            for cparam in (getattr(self, cname) for cname in self.paramnames)
            if not cparam.fixed
        ]
        # logf values always follow the regular parameters in the vector
        if hasattr(self, "logf"):
            free_params.extend(self.logf.values())

        for i, cparam in enumerate(free_params):
            cparam.value = fit_params[i]
            # uncertainties are stored for all the fit parameters, including logf
            if uncs is not None:
                cparam.unc = uncs[i]



[docs]
    def get_nonfixed_paramnames(self):
        """
        Get the names of the non-fixed parameters.  Useful for plotting.
        Non-fixed logf parameters (if any) are given as "logf[key]".

        Returns
        -------
        names : list of str
            non-fixed parameter names
        """
        free_names = [
            pname for pname in self.paramnames if not getattr(self, pname).fixed
        ]
        if hasattr(self, "logf"):
            free_names.extend(
                f"logf[{key}]" for key, par in self.logf.items() if not par.fixed
            )
        return free_names



[docs]
    def check_param_limits(self):
        """
        Check the parameters (including logf, if any) are within the parameter
        bounds.  A bound of None means no limit on that side.

        Raises
        ------
        ValueError
            if a parameter value is below or above its bounds
        """

        def _check(label, param):
            # raise if the value of a single parameter is outside of its bounds
            pval = param.value
            pbounds = param.bounds
            if (pbounds[0] is not None) and (pval < pbounds[0]):
                raise ValueError(
                    f"{label} = {pval} is below the bounds ({pbounds[0]}, {pbounds[1]})"
                )
            elif (pbounds[1] is not None) and (pval > pbounds[1]):
                raise ValueError(
                    f"{label} = {pval} is above the bounds ({pbounds[0]}, {pbounds[1]})"
                )

        for cname in self.paramnames:
            _check(cname, getattr(self, cname))
        if hasattr(self, "logf"):
            for ckey in self.logf.keys():
                # label uses the logf key (not the last regular parameter name)
                _check(f"logf[{ckey}]", self.logf[ckey])



[docs]
    def add_exclude_region(self, exreg):
        """
        Append a region to the regions that are excluded from the fitting.

        Parameters
        ----------
        exreg : list
            2 element list with min/max given in 1/micron

        Raises
        ------
        ValueError
            if the first element is larger than the second one
        """
        region_min, region_max = exreg[0], exreg[1]
        if region_min > region_max:
            raise ValueError(
                "exclude region to be added has [max, min], reverse needed"
            )
        # new array with the region added as the last row
        self.exclude_regions = np.append(self.exclude_regions, [exreg], axis=0)



[docs]
    def fit_weights(self, obsdata):
        """
        Compute the weights to be used for fitting and store them in
        self.weights (one array per type of observed data).
        The base weights are 1/unc (expected by fitters).
        Points without data, with non-finite or non-positive fluxes, or with
        non-positive uncertainties get a weight of zero, as do points in the
        exclude regions (regions known to have data issues or that the models
        do not include, e.g., stellar wind lines, geocoronal Ly-alpha).

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star
        """
        self.weights = {}
        for cspec in list(obsdata.data):
            spec = obsdata.data[cspec]

            # start with all zeros, then fill in the usable points
            spec_weights = self.weights[cspec] = np.full(len(spec.fluxes), 0.0)
            usable = (
                (spec.npts > 0)
                & np.isfinite(spec.fluxes)
                & (spec.fluxes.value > 0.0)
                & (spec.uncs.value > 0.0)
            )
            spec_weights[usable] = 1.0 / spec.uncs[usable].value

            if self.exclude_regions is None:
                continue

            # exclude regions are compared to the inverse wavelengths
            x = 1.0 / spec.waves
            for region in self.exclude_regions:
                inside = np.logical_and(x >= region[0], x <= region[1])
                spec_weights[inside] = 0.0



[docs]
    def stellar_sed(self, moddata):
        """
        Compute the stellar SED from the model parameters.

        The SED is a weighted average of the moddata.n_nearest grid models
        closest to the requested stellar parameters, with weights given by
        the inverse of the (width normalized) distance in parameter space.

        If foreground dust extinction included, then also includes the
        foreground dust extinction.  Including this here results in extinction
        curves that do not include the foreground extinction.

        Parameters
        ----------
        moddata : ModelData object
            all the information about the model spectra

        Returns
        -------
        sed : dict
            SED with {'bands': band_sed, 'spec': spec_sed, ...}
        """
        # compute the distance between model params and grid points
        #    probably a better way using a kdtree
        dist2 = (
            (self.logTeff.value - moddata.temps) ** 2 / moddata.temps_width2
            + (self.logg.value - moddata.gravs) ** 2 / moddata.gravs_width2
            + (self.logZ.value - moddata.mets) ** 2 / moddata.mets_width2
            + (self.vturb.value - moddata.vturb) ** 2 / moddata.vturb_width2
        )
        # indices of the n_nearest closest grid models
        sindxs = np.argsort(dist2)
        gsindxs = sindxs[0 : moddata.n_nearest]

        # generate model SED from nearest neighbors
        #   should handle the case where dist2 has an element that is zero
        #   i.e., one of the precomputed models exactly matches the request
        if np.sum(dist2[gsindxs]) > 0:
            # check for any zero distance cases, requested parameters are directly on a model
            # in this case set the distance to 0.01 of the min distance so this model dominates
            tvals = dist2[gsindxs] == 0.0
            if sum(tvals) > 0:
                dist2[gsindxs[tvals]] = 0.01 * np.min(dist2[gsindxs[~tvals]])

            weights = 1.0 / np.sqrt(dist2[gsindxs])
        else:
            # all the nearest models are at zero distance, use equal weights
            weights = np.full(len(gsindxs), 1.0)
        # normalize so the weights sum to one
        weights /= np.sum(weights)

        if self.fore_Av.value > 0.0:
            if self.fore_sampling:
                # draw the foreground R(V) and A(V) from their Gaussian priors
                # and clip the draws to the parameter bounds
                tRv = self.rng.normal(loc=self.fore_Rv.prior[0], scale=self.fore_Rv.prior[1])
                tRv = max(self.fore_Rv.bounds[0], min(tRv, self.fore_Rv.bounds[1]))
                tAv = self.rng.normal(loc=self.fore_Av.prior[0], scale=self.fore_Av.prior[1])
                tAv = max(self.fore_Av.bounds[0], min(tAv, self.fore_Av.bounds[1]))
            else:
                tRv = self.fore_Rv.value
                tAv = self.fore_Av.value
            g23mod = G23(Rv=tRv)

        sed = {}
        for cspec in moddata.fluxes.keys():
            # dot product does the multiplication and sum
            sed[cspec] = np.dot(weights, moddata.fluxes[cspec][gsindxs, :])

            # zero fluxes are replaced with NaN
            sed[cspec][sed[cspec] == 0] = np.nan
            # shift spectrum if velocity given
            if self.velocity.value != 0.0:
                cwaves = moddata.waves[cspec]
                sed[cspec] = np.interp(
                    cwaves, (1.0 + self.velocity.value / 2.998e5) * cwaves, sed[cspec]
                )
            # wind term only applied if all the wavelengths are > 1 micron
            # (np.min of a boolean array is True only if all elements are True)
            if (self.windamp.value != 0.0) and np.min(
                moddata.waves[cspec] > 1.0 * u.micron
            ):
                cwaves = moddata.waves[cspec].value
                sed[cspec] *= 1.0 + self.windamp.value * (
                    np.power(cwaves, self.windalpha.value)
                    # - np.power(4.0, self.windalpha.value
                )

            # apply the foreground dust extinction
            if self.fore_Av.value > 0.0:
                axav = g23mod(moddata.waves[cspec])
                sed[cspec] = sed[cspec] * (10 ** (-0.4 * axav * tAv))

            # remove bands not in the observed data
            if (cspec == "BAND") and (self.obsdata_bands is not None):
                sed[cspec] = sed[cspec][self.obsdata_gvals]

        return sed



[docs]
    def dust_extinguished_sed(self, moddata, sed):
        """
        Dust extinguished sed given the extinction parameters.

        The spectral pieces are extinguished directly.  The BAND fluxes are
        computed by integrating the extinguished "MODEL_FULL_LOWRES" spectrum
        over the band response functions.

        Parameters
        ----------
        moddata : ModelData object
            all the information about the model spectra

        sed : dict
            fluxes for each spectral piece

        Returns
        -------
        extinguished sed : dict
            SED with {'bands': band_sed, 'spec': spec_sed, ...}
        """
        g23mod = G23()

        # allows for extrapolation outside of bounds for the G23 R(V) relationship
        g23mod.Rv_range = self.Rv.bounds
        g23mod.Rv = self.Rv.value

        # create the extinguished sed
        ext_sed = {}
        if not self.g23_all_ext:
            # optical/NIR portion of the curve from G23
            optnir_axav_x = np.flip(1.0 / (np.arange(0.35, 30.0, 0.1) * u.micron))
            optnir_axav_y = g23mod(optnir_axav_x)

            # updated F04 C1-C2 correlation
            C1 = 2.18 - 2.91 * self.C2.value

        for cspec in moddata.fluxes.keys():
            if cspec != "BAND":
                # get the dust extinguished SED (account for the
                #  systemic velocity of the galaxy [opposite regular sense])
                shifted_waves = (1.0 - self.velocity.value / 2.998e5) * moddata.waves[
                    cspec
                ]

                # convert to 1/micron as _curve_F99_method does not do this (as of Nov 2024)
                with u.add_enabled_equivalencies(u.spectral()):
                    shifted_waves_imicron = u.Quantity(
                        shifted_waves, 1.0 / u.micron, dtype=np.float64
                    )

                if self.g23_all_ext:
                    axav = g23mod(shifted_waves_imicron)
                else:
                    axav = _curve_F99_method(
                        shifted_waves_imicron.value,
                        self.Rv.value,
                        C1,
                        self.C2.value,
                        self.B3.value,
                        self.C4.value,
                        xo=self.xo.value,
                        gamma=self.gamma.value,
                        optnir_axav_x=optnir_axav_x.value,
                        optnir_axav_y=optnir_axav_y,
                        fm90_version="B3",
                    )

                ext_sed[cspec] = sed[cspec] * (10 ** (-0.4 * axav * self.Av.value))

        # update the BAND fluxes by integrating the reddened MODEL_FULL spectrum
        # only do this for the observed bands (model can have many more)
        if "BAND" in moddata.fluxes.keys():
            if self.obsdata_bands is not None:
                tbands = self.obsdata_bands
            else:
                tbands = moddata.band_names
            band_sed = np.zeros(len(tbands))
            if len(tbands) > 0:
                # the spectrum to integrate is the same for all the bands,
                # so prepare it once instead of once per band
                gvals = np.isfinite(ext_sed["MODEL_FULL_LOWRES"])
                iwave = (1.0 - self.velocity.value / 2.998e5) * moddata.waves[
                    "MODEL_FULL_LOWRES"
                ][gvals]
                iflux = ext_sed["MODEL_FULL_LOWRES"][gvals]
                for k, cband in enumerate(tbands):
                    iresp = moddata.band_resp[cband](iwave)
                    # set nans to zero - happens for ACS bands
                    iresp[~np.isfinite(iresp)] = 0.0
                    # response weighted average flux
                    inttop = np.trapezoid(iwave * iresp * iflux, iwave)
                    intbot = np.trapezoid(iwave * iresp, iwave)
                    band_sed[k] = inttop / intbot
            ext_sed["BAND"] = band_sed

        return ext_sed



[docs]
    def hi_abs_sed(self, moddata, sed):
        """
        HI abs sed given the HI columns.

        The Ly-alpha absorption of the MW and external galaxy components is
        applied to the points within h_width of the Ly-alpha line.

        Parameters
        ----------
        moddata : ModelData object
            all the information about the model spectra

        sed : dict
            fluxes for each spectral piece

        Returns
        -------
        hi absorbed sed : dict
            SED with {'bands': band_sed, 'spec': spec_sed, ...}
        """
        # wavelengths of HI lines
        #     only use Ly-alpha right now - others useful later
        h_lines = (
            np.array(
                [
                    1215.0,
                    1025.0,
                    972.0,
                    949.0,
                    937.0,
                    930.0,
                    926.0,
                    923.0,
                    920,
                    919.0,
                    918.0,
                ]
            )
            * u.angstrom
        )
        # width over which to compute the HI abs
        h_width = 100.0 * u.angstrom

        hi_sed = {}
        for cspec in moddata.fluxes.keys():
            hi_sed[cspec] = np.copy(sed[cspec])
            # points within h_width of Ly-alpha: the absolute value has to be taken
            # of the wavelength difference (not of the result of the comparison),
            # otherwise all the wavelengths blueward of the line are selected
            (indxs,) = np.where(
                np.absolute(moddata.waves[cspec] - h_lines[0]) <= h_width
            )
            if len(indxs) > 0:
                logHI_vals = [self.logHI_MW.value, self.logHI_exgal.value]
                for i, cvel in enumerate([self.vel_MW.value, self.vel_exgal.value]):
                    # compute the Ly-alpha abs: from Bohlin et al. (197?)
                    # line center shifted by the velocity of the component (km/s)
                    abs_wave = (1.0 + (cvel / 3e5)) * h_lines[0].to(u.micron).value
                    # the 1e4 factor converts the micron difference to Angstrom
                    phi = 4.26e-20 / (
                        (
                            1e4
                            * (
                                moddata.waves[cspec][indxs].to(u.micron).value
                                - abs_wave
                            )
                        )
                        ** 2
                        + 6.04e-10
                    )

                    nhi = 10 ** logHI_vals[i]
                    hi_sed[cspec][indxs] = hi_sed[cspec][indxs] * np.exp(
                        -1.0 * nhi * phi
                    )

        return hi_sed



[docs]
    def set_initial_norm(self, obsdata, modeldata):
        """
        Set the initial normalization that puts the current model at the average
        level of the observed data.
        The normalization is a fit parameter, so is included fully in the fitting.
        Uses self.weights, so fit_weights needs to be called first.

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modeldata : ModelData object
            all the information about the model spectra
        """

        # intrinsic sed
        modsed = self.stellar_sed(modeldata)

        # dust extinguished sed
        ext_modsed = self.dust_extinguished_sed(modeldata, modsed)

        # hi absorbed (ly-alpha) sed
        hi_ext_modsed = self.hi_abs_sed(modeldata, ext_modsed)

        # compute the normalization factors for the model and observed data
        # model data normalized to the observations using the ratio
        #   weighted average of the averages of each type of data (photometry or specific spectrum)
        #   allows for all the data to contribute to the normalization
        #   weighting by number of points in each type of data to achieve the highest S/N in
        #     the normalization
        norm_mod = []
        norm_dat = []
        norm_npts = []
        for cspec in obsdata.data.keys():
            gvals = (self.weights[cspec] > 0) & (np.isfinite(hi_ext_modsed[cspec]))
            npts = np.sum(gvals)
            # a type of data without any usable points has a NaN average that
            # would make the normalization NaN even with a weight of zero
            if npts == 0:
                continue
            norm_npts.append(npts)
            norm_mod.append(np.average(hi_ext_modsed[cspec][gvals]))
            norm_dat.append(np.average(obsdata.data[cspec].fluxes[gvals].value))
        norm_model = np.average(norm_mod, weights=norm_npts)
        norm_data = np.average(norm_dat, weights=norm_npts)
        self.norm.value = norm_data / norm_model



[docs]
    def lnlike(self, obsdata, modeldata):
        """
        Compute the natural log of the likelihood that the data
        fits the model.  Uses self.weights, so fit_weights needs to be called first.

        If the model has logf parameters, the variance of each point is
        unc^2 + model^2 * exp(2 * logf), i.e., the uncertainties are assumed to
        be underestimated by a fraction exp(logf) of the model.

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modeldata : ModelData object
            all the information about the model spectra

        Returns
        -------
        lnp : float
            natural log of the likelihood

        Raises
        ------
        ValueError
            if the model and observed data do not match
        """
        # intrinsic sed
        modsed = self.stellar_sed(modeldata)

        # dust extinguished sed
        ext_modsed = self.dust_extinguished_sed(modeldata, modsed)

        # hi absorbed (ly-alpha) sed
        hi_ext_modsed = self.hi_abs_sed(modeldata, ext_modsed)

        lnl = 0.0
        for cspec in obsdata.data.keys():
            try:
                gvals = (self.weights[cspec] > 0) & (np.isfinite(hi_ext_modsed[cspec]))
            except ValueError as err:
                raise ValueError(
                    "Oops! The model data and reddened star data did not match.\n Hint: Make sure that the BAND name in the .dat files match."
                ) from err
            model = hi_ext_modsed[cspec][gvals] * self.norm.value

            if hasattr(self, "logf"):
                unc = 1.0 / self.weights[cspec][gvals]
                # extra variance is a fraction of the model: the fraction multiplies
                # the model squared (adding it would assume 100% model uncertainties)
                unc2 = unc**2 + model**2 * np.exp(2.0 * self.logf[cspec].value)
                weights = 1.0 / np.sqrt(unc2)
                # normalization term, needed as the variance depends on fit parameters
                lnextra = np.log(unc2)
            else:
                weights = self.weights[cspec][gvals]
                lnextra = 0.0

            chiarr = (
                np.square(((obsdata.data[cspec].fluxes[gvals].value - model) * weights))
                + lnextra
            )
            lnl += -0.5 * np.sum(chiarr)

        return lnl



[docs]
    def lnprior(self):
        """
        Compute the natural log of the priors.
        Only Gaussian priors currently supported.
        The bounds of the non-fixed parameters and of the logf parameters
        (if any) are checked; lnp_bignum is returned if one is outside its bounds.

        Returns
        -------
        lnp : float
            natural log of the prior
        """

        def outside_bounds(par):
            # a bound of None means no limit on that side
            lower, upper = par.bounds[0], par.bounds[1]
            if (lower is not None) and (par.value < lower):
                return True
            return (upper is not None) and (par.value > upper)

        total = 0.0
        for pname in self.paramnames:
            par = getattr(self, pname)
            if par.fixed:
                continue
            if outside_bounds(par):
                return self.lnp_bignum
            if par.prior is not None:
                mean, sigma = par.prior[0], par.prior[1]
                total += -0.5 * ((par.value - mean) / sigma) ** 2

        if hasattr(self, "logf"):
            for par in self.logf.values():
                if outside_bounds(par):
                    return self.lnp_bignum

        return total



[docs]
    def lnprob(self, obsdata, modeldata):
        """
        Compute the natural log of the probability: ln(prior) + ln(likelihood).
        The likelihood is not computed if the prior is equal to lnp_bignum.

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modeldata : ModelData object
            all the information about the model spectra

        Returns
        -------
        lnp : float
            natural log of the probability
        """
        ln_prior = self.lnprior()
        if ln_prior != self.lnp_bignum:
            return ln_prior + self.lnlike(obsdata, modeldata)
        return ln_prior



[docs]
    def fit_minimizer(self, obsdata, modinfo, maxiter=1000):
        """
        Run a minimizer (formally an optimizer) to find the best fit parameters
        by minimizing the negative of the ln(probability).

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modinfo : ModelData object
            all the information about the model spectra

        maxiter : int
            maximum number of iterations for the minimizer [default=1000]

        Returns
        -------
        fitmod, result : list
            fitmod is a MEModel with the best fit parameters
            result is the scipy minimizer output

        Raises
        ------
        ValueError
            if the ln(likelihood) or ln(prior) at the starting position is not finite
            (check_param_limits also raises if a parameter is outside its bounds)
        """
        # shallow copy: the parameter objects are shared with this model
        outmod = copy.copy(self)

        # the starting position has to be inside the bounds
        self.check_param_limits()

        # and has to give valid values, evaluated (and checked) one at a time
        checks = (
            ("ln(likelihood) is not finite", lambda: outmod.lnlike(obsdata, modinfo)),
            ("ln(prior) is not finite", outmod.lnprior),
        )
        for message, evaluate in checks:
            if not np.isfinite(evaluate()):
                raise ValueError(message)

        # op.minimize searches for a minimum (not a maximum like MCMC algorithms),
        # so give it the negative of the ln(probability)
        def negative_lnprob(free_values, memodel, *extra):
            memodel.fit_to_parameters(free_values)
            return -memodel.lnprob(*extra)

        # start from the current values of the non-fixed parameters
        result = op.minimize(
            negative_lnprob,
            outmod.parameters_to_fit(),
            args=(outmod, obsdata, modinfo),
            method="Nelder-Mead",
            options={"maxiter": maxiter},
        )

        # set the best fit parameters in the output model
        outmod.fit_to_parameters(result["x"])

        return (outmod, result)



[docs]
    def fit_sampler(
        self,
        obsdata,
        modinfo,
        nsteps=1000,
        burnfrac=0.5,
        initfrac=0.01,
        save_samples=None,
        multiproc=False,
        resume=False,
    ):
        """
        Run a sampler (specifically emcee) to find the detailed
        parameters including uncertainties.

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modinfo : ModelData object
            all the information about the model spectra

        nsteps : int
            number of steps for the sampler chains [default=1000]

        burnfrac : float
            fraction of nsteps to discard as the burn in [default=0.5]

        initfrac : float
            fractional (multiplicative) width of the walker ball around the
            initial position [default=0.01]

        save_samples : filename
            name of hd5 file to save the MCMC samples [default=None]

        multiproc : boolean
            set to run the emcee in parallel (does not speed up things much) [default=False]

        resume : boolean
            resume from previous run (requires save_samples to be an existing emcee hd5 save file)

        Returns
        -------
        fitmod, flat_samples, sampler : tuple
            fitmod is a MEModel with the 50th percentile parameters and the
            averaged +/- (84th-50th, 50th-16th percentile) uncertainties
            flat_samples is the flattened chain after discarding the burn in
            sampler is the emcee EnsembleSampler object

        Raises
        ------
        ValueError
            if the starting ln(likelihood) or ln(prior) is not finite, or if
            resume is requested without a save_samples file
        """
        # make a copy of the model
        outmod = copy.copy(self)

        # check that the parameters are all within the bounds
        self.check_param_limits()

        # check that the initial starting position returns a valid values
        if not np.isfinite(outmod.lnlike(obsdata, modinfo)):
            raise ValueError("ln(likelihood) is not finite")
        if not np.isfinite(outmod.lnprior()):
            raise ValueError("ln(prior) is not finite")

        # resuming needs the walker state stored in a previous save file;
        # fail here with a clear message instead of deep inside emcee
        if resume and not save_samples:
            raise ValueError("resume=True requires save_samples to be set")

        # get the non-fixed initial parameters
        p0 = np.asarray(outmod.parameters_to_fit())

        # setup the samplers
        ndim = len(p0)
        nwalkers = 2 * ndim

        if not resume:
            # setting up the walkers to start "near" the initial guess
            # (one row of ndim perturbed values per walker)
            p = p0 * (1 + initfrac * np.random.normal(0, 1.0, (nwalkers, ndim)))

            # make sure the walkers are within the bounds, set to bounds if not
            # (a bound of None means unbounded on that side)
            lower = np.full(ndim, -np.inf)
            upper = np.full(ndim, np.inf)
            for j, cname in enumerate(self.get_nonfixed_paramnames()):
                pbounds = getattr(self, cname).bounds
                if pbounds[0] is not None:
                    lower[j] = pbounds[0]
                if pbounds[1] is not None:
                    upper[j] = pbounds[1]
            p = np.clip(p, lower, upper)
        else:
            # None tells emcee to continue from the state stored in the backend
            p = None

        if save_samples:
            save_backend = emcee.backends.HDFBackend(save_samples)
            if not resume:
                # Don't forget to clear it in case the file already exists
                save_backend.reset(nwalkers, ndim)
        else:
            save_backend = None

        # keyword arguments shared by the serial and parallel samplers
        sampler_kwargs = {
            "args": (outmod, obsdata, modinfo),
            "backend": save_backend,
        }

        # setup and run the sampler
        if multiproc:
            with Pool() as pool:
                sampler = emcee.EnsembleSampler(
                    nwalkers,
                    ndim,
                    _lnprob,
                    pool=pool,
                    **sampler_kwargs,
                )
                sampler.run_mcmc(p, nsteps, progress=True)
        else:
            sampler = emcee.EnsembleSampler(
                nwalkers,
                ndim,
                _lnprob,
                **sampler_kwargs,
            )
            sampler.run_mcmc(p, nsteps, progress=True)

        # create the samples variable for later use
        flat_samples = sampler.get_chain(discard=int(burnfrac * nsteps), flat=True)

        # get the 50 percentile and +/- uncertainties
        p16, p50, p84 = np.percentile(flat_samples, [16, 50, 84], axis=0)

        # now package the fit parameters into two vectors, averaging the +/- uncs
        params_p50 = np.array(p50, dtype=float)
        params_unc = 0.5 * ((p84 - p50) + (p50 - p16))

        # set the best fit parameters in the output model
        outmod.fit_to_parameters(params_p50, uncs=params_unc)

        return (outmod, flat_samples, sampler)



[docs]
    def plot(
        self,
        obsdata,
        modinfo,
        resid_range=10.0,
        lyaplot=False,
        xticks=[0.1, 0.2, 0.3, 0.5, 0.7, 1.0, 2.0],
    ):
        """
        Standard plot showing the data and best fit.

        The top panel shows the observations and the model at each stage
        (star, optional foreground, dust extinguished, dust+gas extinguished),
        all multiplied by wavelength^4.  The bottom panel shows the percentage
        residuals between the observations and the final model.

        Parameters
        ----------
        obsdata : StarData object
            observed data for a reddened star

        modinfo : ModelData object
            all the information about the model spectra

        resid_range : float
            percentage value for the +/- range for the residual plot

        lyaplot : boolean
            set to add two panels giving the Ly-alpha fit and residuals

        xticks : vector
            set to a vector of floats giving the values for the xticks,
            None skips the custom ticks (the default list is only read)

        Returns
        -------
        fig : object
            returns the standard matplotlib fig info
        """
        # plotting setup for easier to read plots
        # NOTE: plt.rc changes the global matplotlib settings
        fontsize = 16
        font = {"size": fontsize}
        plt.rc("font", **font)
        plt.rc("lines", linewidth=1)
        plt.rc("axes", linewidth=2)
        plt.rc("xtick.major", width=2)
        plt.rc("xtick.minor", width=2)
        plt.rc("ytick.major", width=2)
        plt.rc("ytick.minor", width=2)

        # residual plot color for each known spectrum type
        grating_info = {"STIS_G140L": "indigo",
                        "STIS_G230L": "violet",
                        "STIS_G430L": "blue",
                        "STIS_G750L": "green",
                        "WFC3_G102": "orange",
                        "WFC3_G141": "orangered",
                        "MODEL_FULL_LOWRES": "black"}

        # setup the plot
        if lyaplot:
            ncols = 2
            figsize = (14, 8)
            gs_info = {"height_ratios": [3, 1], "width_ratios": [3, 1]}
        else:
            ncols = 1
            figsize = (10, 8)
            gs_info = {"height_ratios": [3, 1]}

        fig, axes = plt.subplots(
            nrows=2,
            ncols=ncols,
            figsize=figsize,
            gridspec_kw=gs_info,
            sharex=False,
        )
        if lyaplot:
            # flatten to [main, main resid, lya, lya resid]
            axes = [axes[0, 0], axes[1, 0], axes[0, 1], axes[1, 1]]
            tax = [axes[0], axes[2]]
            tax_resid = [axes[1], axes[3]]
        else:
            tax = [axes[0]]
            tax_resid = [axes[1]]

        modsed = self.stellar_sed(modinfo)

        if self.fore_Av.value > 0.0:
            # temporarily zero the foreground extinction to get the SED
            # without it, then restore the fitted value
            save_fore_Av = self.fore_Av.value
            self.fore_Av.value = 0.0
            modsed_nofore = self.stellar_sed(modinfo)
            self.fore_Av.value = save_fore_Av

        ext_modsed = self.dust_extinguished_sed(modinfo, modsed)

        hi_ext_modsed = self.hi_abs_sed(modinfo, ext_modsed)

        ax = axes[0]
        # log10 y limits, start inverted so any data value replaces them
        yrange = [100.0, -100.0]
        yrange_lya = [100.0, -100.0]

        first_pass = True
        for cspec in obsdata.data.keys():
            if cspec == "BAND":
                ptype = "o"
                rmarker = "o"
                rcolor = "cyan"
                mline = "none"
            else:
                ptype = "-"
                mline = "-"
                rmarker = "none"
                # unknown spectrum types fall back to black
                rcolor = grating_info.get(cspec, "black")

            if cspec == "BAND":
                cwaves = obsdata.data[cspec].waves
            else:
                cwaves = modinfo.waves[cspec]

            # nan models where no data or excluded
            nvals = np.full(len(cwaves), 1.0)
            nvals[self.weights[cspec] == 0.0] = np.nan
            # multlam plots everything (faint), multval only the points with
            # non-zero weight (bold)
            multlam = self.norm.value * np.power(cwaves, 4.0)
            multval = multlam * nvals

            # only label the curves once so the legend has no duplicates
            if first_pass:
                plabs = [
                    "Obs",
                    "Star",
                    "w/ Foreground",
                    "w/ Dust Ext",
                    "w/ Dust+Gas Ext",
                ]
            else:
                plabs = [None, None, None, None, None]

            for cax in tax:
                if self.fore_Av.value > 0.0:
                    cax.plot(
                        cwaves, modsed_nofore[cspec] * multlam, "c" + ptype, alpha=0.2
                    )
                    cax.plot(
                        cwaves,
                        modsed_nofore[cspec] * multval,
                        "c" + ptype,
                        label=plabs[1],
                    )
                    cax.plot(
                        cwaves, modsed[cspec] * multval, "b" + ptype, label=plabs[2]
                    )
                else:
                    cax.plot(
                        cwaves, modsed[cspec] * multval, "b" + ptype, label=plabs[1]
                    )
                cax.plot(cwaves, modsed[cspec] * multlam, "b" + ptype, alpha=0.2)
                cax.plot(cwaves, ext_modsed[cspec] * multlam, "g" + ptype, alpha=0.2)
                cax.plot(
                    cwaves, ext_modsed[cspec] * multval, "g" + ptype, label=plabs[3]
                )
                cax.plot(cwaves, hi_ext_modsed[cspec] * multlam, "r" + ptype, alpha=0.2)
                cax.plot(
                    cwaves, hi_ext_modsed[cspec] * multval, "r" + ptype, label=plabs[4]
                )

                # observed data: all positive fluxes faint, weighted points bold
                gvals = obsdata.data[cspec].fluxes > 0.0
                cax.plot(
                    obsdata.data[cspec].waves[gvals],
                    obsdata.data[cspec].fluxes[gvals]
                    * np.power(obsdata.data[cspec].waves[gvals], 4.0),
                    "k" + ptype,
                    alpha=0.2,
                )
                cax.plot(
                    obsdata.data[cspec].waves * nvals,
                    obsdata.data[cspec].fluxes
                    * np.power(obsdata.data[cspec].waves, 4.0)
                    * nvals,
                    "k" + ptype,
                    label=plabs[0],
                    alpha=0.75,
                )
                first_pass = False

            # plot the residuals (in percent of the model)
            gvals = hi_ext_modsed[cspec] > 0.0
            modspec = hi_ext_modsed[cspec][gvals] * self.norm.value
            diff = 100.0 * (obsdata.data[cspec].fluxes.value[gvals] - modspec) / modspec
            uncs = 100.0 * obsdata.data[cspec].uncs.value[gvals] / modspec

            nvals = np.full(len(diff), 1.0)
            nvals[(self.weights[cspec])[gvals] == 0.0] = np.nan

            if cspec != "BAND":
                calpha = 0.5
            else:
                calpha = 0.75
            for cax in tax_resid:
                cax.errorbar(
                    cwaves[gvals],
                    diff,
                    yerr=uncs,
                    color=rcolor,
                    marker=rmarker,
                    linestyle=mline,
                    alpha=0.2,
                )
                cax.errorbar(
                    cwaves[gvals] * nvals,
                    diff * nvals,
                    yerr=uncs,
                    color=rcolor,
                    marker=rmarker,
                    linestyle=mline,
                    alpha=calpha,
                )

            # info for y limits of plot - make sure not not include Ly-alpha
            gvals = np.logical_or(
                cwaves > 0.125 * u.micron,
                cwaves < 0.118 * u.micron,
            )
            gvals = np.logical_and(gvals, cwaves > 0.11 * u.micron)
            # skip when nothing is selected, nanmin/nanmax fail on empty arrays
            if np.sum(gvals) > 0:
                multval = self.norm.value * np.power(cwaves[gvals], 4.0)
                mflux = (hi_ext_modsed[cspec][gvals] * multval).value
                tyrange = np.log10([np.nanmin(mflux), np.nanmax(mflux)])
                yrange[0] = np.min([tyrange[0], yrange[0]])
                yrange[1] = np.max([tyrange[1], yrange[1]])

            # info for y limits of lya plot
            if lyaplot:
                gvals = np.logical_and(
                    cwaves < 0.140 * u.micron,
                    cwaves > 0.118 * u.micron,
                )
                gvals = np.logical_and(gvals, np.isfinite(hi_ext_modsed[cspec]))
                if np.sum(gvals) > 0:
                    gvals = np.logical_and(gvals, cwaves > 0.11 * u.micron)
                    multval = self.norm.value * np.power(cwaves[gvals], 4.0)
                    mflux = (hi_ext_modsed[cspec][gvals] * multval).value
                    tyrange = np.log10([np.nanmin(mflux), np.nanmax(mflux)])
                    yrange_lya[0] = np.min([tyrange[0], yrange_lya[0]])
                    yrange_lya[1] = np.max([tyrange[1], yrange_lya[1]])

        tax[0].legend(ncol=2, fontsize=0.7 * fontsize)

        ax.set_xscale("log")
        axes[1].set_xscale("log")
        ax.set_yscale("log")

        if xticks is not None:
            # the requested ticks are set as labelled minor ticks on the
            # main and residual panels
            for tick_ax in [ax, axes[1]]:
                tick_ax.xaxis.set_major_formatter(ScalarFormatter())
                tick_ax.xaxis.set_minor_formatter(ScalarFormatter())
                tick_ax.set_xticks(xticks, minor=True)
                tick_ax.tick_params(axis="x", which="minor", labelsize=fontsize * 0.8)

        # pad the log10 range by 10% on each side and convert to linear units
        ydelt = yrange[1] - yrange[0]
        yrange[0] = 10 ** (yrange[0] - 0.1 * ydelt)
        yrange[1] = 10 ** (yrange[1] + 0.1 * ydelt)
        ax.set_ylim(yrange)

        if lyaplot:
            if np.isfinite(yrange_lya[1]):
                maxr = 10 ** yrange_lya[1]
            else:
                maxr = 1.0
            axes[2].set_ylim(0.0, maxr)
            axes[2].set_xlim(0.115, 0.13)
            axes[3].set_xlim(0.115, 0.13)
            axes[3].set_ylim(-1.0 * resid_range, resid_range)
            axes[3].axhline(0.0, color="k", linestyle=":")
            axes[3].set_xlabel(r"$\lambda$ [$\mu m$]", fontsize=1.3 * fontsize)

        axes[1].set_xlabel(r"$\lambda$ [$\mu m$]", fontsize=1.3 * fontsize)
        ax.set_ylabel(r"$\lambda^4 F(\lambda)$ [RJ units]", fontsize=1.3 * fontsize)
        axes[1].set_ylabel("residuals [%]", fontsize=1.0 * fontsize)
        ax.tick_params("both", length=10, width=2, which="major")
        ax.tick_params("both", length=5, width=1, which="minor")
        axes[1].set_ylim(-1.0 * resid_range, resid_range)
        axes[1].axhline(0.0, color="k", linestyle=":")

        # list the fitted (non-fixed) parameters, except norm, on the main panel
        k = 0
        for cname in self.paramnames:
            param = getattr(self, cname)
            if not param.fixed and (cname != "norm"):
                if param.unc is not None:
                    ptxt = rf"{cname} = ${param.value:.3f} \pm {param.unc:.3f}$"
                else:
                    ptxt = f"{cname} = {param.value:.3f}"
                ax.text(
                    0.65,
                    0.7 - k * 0.0325,
                    ptxt,
                    horizontalalignment="left",
                    verticalalignment="center",
                    transform=ax.transAxes,
                    fontsize=0.7 * fontsize,
                )
                k += 1

        # ax.text(0.1, 0.9, obsdata.file, transform=ax.transAxes, fontsize=fontsize)
        ax.set_title((obsdata.file).replace(".dat", ""), fontsize=fontsize)

        fig.tight_layout()

        return fig



[docs]
    def plot_sampler_chains(self, sampler):
        """
        Plot the sampler chains, one panel per fitted (non-fixed) parameter.

        Parameters
        ----------
        sampler : object
            emcee sampler object

        Returns
        -------
        fig : object
            returns the standard matplotlib fig info
        """

        # the last axis of the chain indexes the fitted parameters
        samples = sampler.get_chain()
        ndim = samples.shape[2]

        # squeeze=False always returns a 2D array of axes, so a fit with a
        # single free parameter can be indexed the same way as any other
        fig, axes = plt.subplots(ndim, figsize=(10, 15), sharex=True, squeeze=False)
        axes = axes[:, 0]

        labels = self.get_nonfixed_paramnames()
        for i, ax in enumerate(axes):
            ax.plot(samples[:, :, i], "k", alpha=0.3)
            ax.set_xlim(0, len(samples))
            ax.set_ylabel(labels[i])
            ax.yaxis.set_label_coords(-0.1, 0.5)

        axes[-1].set_xlabel("step number")

        return fig



[docs]
    def plot_sampler_corner(self, flat_samples):
        """
        Plot the standard corner plot.

        Parameters
        ----------
        flat_samples : array
            flattened sampler chain with one column per non-fixed parameter
            (e.g., the flat_samples returned by fit_sampler)

        Returns
        -------
        fig : object
            returns the standard matplotlib fig info
        """
        labels = self.get_nonfixed_paramnames()
        # corner's keyword is "show_titles"; the misspelled "show_title" is
        # not a corner.corner argument, so the titles were never drawn
        fig = corner.corner(
            flat_samples, labels=labels, show_titles=True, quantiles=[0.16, 0.5, 0.84]
        )

        return fig
Navigation

Source code for measure_extinction.model