Source code for niriss_tools.grism.specgen

"""
Functions and classes for generating specific types of model spectra.
"""

import warnings
from copy import deepcopy
from functools import partial
from multiprocessing import Pool
from pathlib import Path

import bagpipes
import h5py
import numpy as np
import spectres
from bagpipes import config, filters, utils
from bagpipes.input.spectral_indices import measure_index
from bagpipes.models import chemical_enrichment_history
from bagpipes.models import model_galaxy as BagpipesModelGalaxy
from bagpipes.models import star_formation_history as BagpipesSFH
from bagpipes.models.agn_model import agn
from bagpipes.models.dust_attenuation_model import dust_attenuation
from bagpipes.models.dust_emission_model import dust_emission
from bagpipes.models.igm_model import igm

# from bagpipes.models.agn_model import agn
from bagpipes.models.nebular_model import nebular
from bagpipes.models.stellar_model import stellar
from grizli.utils_numba.interp import interp_conserve_c
from numpy.typing import ArrayLike
from tqdm import tqdm

# Names exported by ``from niriss_tools.grism.specgen import *``.
__all__ = [
    "ExtendedModelGalaxy",
    "CLOUDY_LINE_MAP",
    "check_coverage",
    "NIRISS_050_FILTER_LIMITS",
    "NIRISS_001_FILTER_LIMITS",
    "BagpipesSampler",
]

# Lookup table relating Cloudy emission-line labels to the names stored
# under the "grizli" key. Each entry is a dict with:
#   "cloudy": one or more Cloudy line labels grouped into this entry,
#   "grizli": the matching line name (presumably grizli's naming
#             convention - TODO confirm),
#   "wave":   the line wavelength (presumably rest-frame, in Angstroms -
#             TODO confirm whether air or vacuum).
CLOUDY_LINE_MAP = [
    # Paschen series
    {
        "cloudy": [
            "H  1  1.87510m",
        ],
        "grizli": "PaA",
        "wave": 18756.3,
    },
    {
        "cloudy": [
            "H  1  1.28181m",
        ],
        "grizli": "PaB",
        "wave": 12821.7,
    },
    {
        "cloudy": [
            "H  1  1.09381m",
        ],
        "grizli": "PaG",
        "wave": 10941.2,
    },
    {
        "cloudy": [
            "H  1  1.00494m",
        ],
        "grizli": "PaD",
        "wave": 10052.2,
    },
    # Balmer Series
    # NOTE(review): the [N II] doublet is grouped with H-alpha here,
    # presumably because the lines are blended at grism resolution -
    # TODO confirm.
    {
        "cloudy": [
            "H  1  6562.80A",
            "N  2  6583.45A",
            "N  2  6548.05A",
        ],
        "grizli": "Ha",
        "wave": 6564.697,
    },
    {
        "cloudy": ["H  1  4861.32A"],
        "grizli": "Hb",
        "wave": 4862.738,
    },
    # {
    #     "cloudy": ["H  1  4340.46A"],
    #     "grizli": "Hg",
    #     "wave": 4341.731,
    # },
    # {
    #     "cloudy": ["H  1  4101.73A"],
    #     "grizli": "Hd",
    #     "wave": 4102.936,
    # },
    # Oxygen
    {
        "cloudy": [
            "O  3  5006.84A",
        ],
        "grizli": "OIII-5007",
        "wave": 5008.240,
    },
    {
        "cloudy": [
            "O  3  4958.91A",
        ],
        "grizli": "OIII-4959",
        "wave": 4960.295,
    },
    {
        "cloudy": ["O  3  4363.21A"],
        "grizli": "OIII-4363",
        "wave": 4364.436,
    },
    {
        "cloudy": [
            "O  2  3726.03A",
            "O  2  3728.81A",
        ],
        "grizli": "OII",
        "wave": 3728.48,
    },
    # Sulphur
    {
        "cloudy": [
            "S  3  9530.62A",
        ],
        "grizli": "SIII-9530",
        "wave": 9530.62,
    },
    {
        "cloudy": [
            "S  3  9068.62A",
        ],
        "grizli": "SIII-9068",
        "wave": 9068.62,
    },
    {
        "cloudy": [
            "S  2  6730.82A",
            "S  2  6716.44A",
        ],
        "grizli": "SII",
        "wave": 6725.48,
    },
    {
        "cloudy": [
            "S  3  6312.06A",
        ],
        "grizli": "SIII-6314",
        "wave": 6313.81,
    },
    # Helium
    {
        "cloudy": [
            "Blnd  1.08302m",
        ],
        "grizli": "HeI-1083",
        "wave": 10830.3,
    },
    {
        "cloudy": [
            "Blnd  5875.66A",
        ],
        "grizli": "HeI-5877",
        "wave": 5877.249,
    },
    {
        "cloudy": [
            "He 1  3888.64A",
        ],
        "grizli": "HeI-3889",
        "wave": 3889.75,
    },
    # Neon
    {
        "cloudy": [
            "Ne 3  3868.76A",
        ],
        "grizli": "NeIII-3867",
        "wave": 3869.87,
    },
]

# Wavelength coverage of each NIRISS grism filter, as
# ``[min_wavelength, max_wavelength]`` in Angstroms.
# NOTE(review): the "050" and "001" suffixes presumably refer to the
# throughput level at which the limits are defined (50% and 1%) - TODO
# confirm. The "001" limits are the wider of the two sets.
NIRISS_050_FILTER_LIMITS = {
    # "F090W": [7960, 10050],
    "F115W": [10130, 12830],
    "F150W": [13300, 16710],
    "F200W": [17510, 22260],
}

# Used as the default ``filter_limits`` of ``check_coverage``.
NIRISS_001_FILTER_LIMITS = {
    # "F090W": [7960, 10050],
    "F115W": [10010, 12930],
    "F150W": [13200, 16810],
    "F200W": [17380, 22420],
}



[docs]
def check_coverage(
    obs_wavelength: float, filter_limits: dict = NIRISS_001_FILTER_LIMITS
):
    """
    Test whether observed wavelengths fall inside any filter's limits.

    Parameters
    ----------
    obs_wavelength : float
        The observed wavelength of the line. Array-like input is also
        accepted; a scalar is promoted to a one-element array.
    filter_limits : dict, optional
        A dictionary, where the keys are the names of the grism filters,
        and the values are array-like, containing
        ``[min_wavelength, max_wavelength]``. Defaults to
        ``NIRISS_001_FILTER_LIMITS``.

    Returns
    -------
    numpy.ndarray
        A boolean array with the shape of ``np.atleast_1d(obs_wavelength)``.
        An element is ``True`` if that wavelength lies within the
        (inclusive) limits of at least one filter, else ``False``.
    """

    wavs = np.atleast_1d(obs_wavelength)

    # Accumulate the logical OR of the per-filter coverage masks.
    in_any_filter = np.zeros(wavs.shape, dtype=bool)
    for limits in filter_limits.values():
        lower, upper = limits[0], limits[-1]
        in_any_filter |= (wavs >= lower) & (wavs <= upper)

    return in_any_filter



class ExtendedSFH(BagpipesSFH):
    """
    A `bagpipes.star_formation_history` with an optional fast update.

    The only change relative to the parent class is that `update` can
    skip the calculation of derived quantities.
    """

    def update(self, model_components: dict, fast_spec_only: bool = False):
        """
        Recompute the star-formation history for new model components.

        Parameters
        ----------
        model_components : dict
            The new components of the model galaxy.
        fast_spec_only : bool, optional
            If ``True``, skip ``_calculate_derived_quantities`` and only
            do the work needed to generate a model spectrum. By default
            ``False``.
        """

        self.model_components = model_components
        self.redshift = self.model_components["redshift"]

        # Reset the total star-formation history and the physicality flag.
        self.sfh = np.zeros_like(self.ages)
        self.unphysical = False

        # Age of the Universe at this redshift (interpolated value is
        # scaled by 10**9).
        age_at_redshift = np.interp(self.redshift, utils.z_array, utils.age_at_z)
        self.age_of_universe = 10**9 * age_at_redshift

        # Build the star-formation history of every component in turn.
        for name in self.components:

            # The SFH function is the method named after the component;
            # if no such attribute exists, the name with its final
            # character removed is used instead.
            func = name if name in dir(self) else name[:-1]

            self.component_sfrs[name] = np.zeros_like(self.ages)
            self.component_weights[name] = np.zeros_like(config.age_sampling)

            sfh_function = getattr(self, func)
            sfh_function(self.component_sfrs[name], self.model_components[name])

            # Rescale so that the component forms the requested mass.
            mass_norm = np.sum(self.component_sfrs[name] * self.age_widths)
            desired_mass = 10 ** self.model_components[name]["massformed"]
            self.component_sfrs[name] *= desired_mass / mass_norm

            self.sfh += self.component_sfrs[name]

            # Bin the mass formed onto the SSP age grid to get the weights.
            mass_per_age = self.component_sfrs[name] * self.age_widths
            binned_mass, _ = np.histogram(
                self.ages, bins=config.age_bins, weights=mass_per_age
            )
            self.component_weights[name] = binned_mass

        # Any star formation at ages older than the Universe is unphysical.
        older_than_universe = self.ages > self.age_of_universe
        if self.sfh[older_than_universe].max() > 0.0:
            self.unphysical = True

        # ceh: Chemical enrichment history object
        self.ceh = chemical_enrichment_history(
            self.model_components, self.component_weights
        )

        if fast_spec_only:
            return

        self._calculate_derived_quantities()



[docs]
class ExtendedModelGalaxy(BagpipesModelGalaxy):
    """
    An extension of `bagpipes.models.model_galaxy`.

    This class allows a model spectrum to be generated, with one or more
    nebular emission lines excluded.

    Parameters
    ----------
    model_components : dict
        A dictionary containing information about the model you wish to
        generate.
    filt_list : list, optional
        A list of paths to filter curve files, which should contain a
        column of wavelengths in angstroms followed by a column of
        transmitted fraction values. Only required if photometric output
        is desired.
    spec_wavs : array,optional
        An array of wavelengths at which spectral fluxes should be
        returned. Only required of spectroscopic output is desired.
    spec_units : str, optional
        The units the output spectrum will be returned in. Default is
        "ergscma" for ergs per second per centimetre squared per
        angstrom, can also be set to "mujy" for microjanskys.
    phot_units : str, optional
        The units the output photometry will be returned in. Default is
        "ergscma" for ergs per second per centimetre squared per
        angstrom, can also be set to "mujy" for microjanskys.
    index_list : list, optional
        A list of dicts containining definitions for spectral indices.
    """

    def __init__(
        self,
        model_components,
        filt_list=None,
        spec_wavs=None,
        spec_units="ergscma",
        phot_units="ergscma",
        index_list=None,
    ):
        """
        Set up the sub-models and generate the initial model outputs.

        See the class docstring for a description of the parameters.
        Note that a ``"velshift"`` entry (set to 0.0) is inserted into
        ``model_components["nebular"]`` if it is missing.

        Raises
        ------
        ValueError
            If both ``spec_wavs`` and ``index_list`` are supplied, or if
            the model redshift exceeds ``config.max_redshift``.
        """

        both_given = spec_wavs is not None and index_list is not None
        if both_given:
            raise ValueError("Cannot specify both spec_wavs and index_list.")

        if model_components["redshift"] > config.max_redshift:
            raise ValueError(
                "Bagpipes attempted to create a model with too "
                "high redshift. Please increase max_redshift in "
                "bagpipes/config.py before making this model."
            )

        self.spec_wavs = spec_wavs
        self.filt_list = filt_list
        self.spec_units = spec_units
        self.phot_units = phot_units
        self.index_list = index_list

        # Spectral indices define their own set of output wavelengths.
        if self.index_list is not None:
            self.spec_wavs = self._get_index_spec_wavs(model_components)

        has_filters = filt_list is not None

        # The filter curves must be loaded before the wavelength sampling
        # is chosen, and resampled onto it afterwards.
        if has_filters:
            self.filter_set = filters.filter_set(filt_list)

        self.wavelengths = self._get_wavelength_sampling()

        if has_filters:
            self.filter_set.resample_filter_curves(self.wavelengths)

        # Filters used for the rest-frame UVJ magnitudes.
        uvj_list_path = utils.install_dir + "/filters/UVJ.filt_list"
        uvj_filt_list = np.loadtxt(uvj_list_path, dtype="str")

        self.uvj_filter_set = filters.filter_set(uvj_filt_list)
        self.uvj_filter_set.resample_filter_curves(self.wavelengths)

        # Physical models that are always present.
        self.sfh = ExtendedSFH(model_components)
        self.stellar = stellar(self.wavelengths)
        self.igm = igm(self.wavelengths)

        # Optional models: ``False`` means "not included".
        self.nebular = False
        self.dust_atten = False
        self.agn_dust_atten = False
        self.dust_emission = False
        self.agn = False

        if "nebular" in model_components:
            nebular_comp = model_components["nebular"]
            nebular_comp.setdefault("velshift", 0.0)

            self.nebular = nebular(self.wavelengths, nebular_comp["velshift"])

            # A separate SFH object is kept for the nebular metallicity.
            if "metallicity" in nebular_comp:
                self.neb_sfh = ExtendedSFH(model_components)

        if "dust" in model_components:
            self.dust_emission = dust_emission(self.wavelengths)
            self.dust_atten = dust_attenuation(
                self.wavelengths, model_components["dust"]
            )

        if "agn_dust" in model_components:
            self.agn_dust_atten = dust_attenuation(
                self.wavelengths, model_components["agn_dust"]
            )

        if "agn" in model_components:
            self.agn = agn(self.wavelengths)

        self.update(model_components)


[docs]
    def update(
        self,
        model_components: dict,
        cont_only: bool = False,
        rm_line: list[str] | None = None,
        fast_spec_only: bool = True,
    ):
        """
        Regenerate the model outputs for new ``model_components``.

        Only changes to numerical values in the dictionary are supported.

        Parameters
        ----------
        model_components : dict
            A dictionary containing information about the model to be
            generated.
        cont_only : bool, optional
            Generate only the continuum spectra, with no nebular emission
            at all. By default ``False``.
        rm_line : list[str] | None, optional
            The names of one or more lines to exclude from the model
            spectrum, based on the `Cloudy <https://www.nublado.org/>`__
            naming convention (see `here
            <https://bagpipes.readthedocs.io/en/latest/model_galaxies.html#getting-observables-line-fluxes>`__
            for more details). By default ``None``.
        fast_spec_only : bool, optional
            Only perform the operations necessary to generate a model
            spectrum: photometry, UVJ magnitudes and spectral indices
            are skipped. By default ``True``.
        """

        self.model_comp = model_components
        self.sfh.update(model_components, fast_spec_only)

        if self.dust_atten:
            self.dust_atten.update(model_components["dust"])

        if self.agn_dust_atten:
            self.agn_dust_atten.update(model_components["agn_dust"])

        if not self.sfh.unphysical:
            self._calculate_full_spectrum(
                model_components,
                cont_only=cont_only,
                rm_line=rm_line,
                fast_spec_only=fast_spec_only,
            )

        else:
            # An unphysical SFH yields an all-zero spectrum.
            warnings.warn(
                "The requested model includes stars which formed "
                "before the Big Bang, no spectrum generated.",
                RuntimeWarning,
            )

            self.spectrum_full = np.zeros_like(self.wavelengths)
            self.uvj = np.zeros(3)

        if self.spec_wavs is not None:
            self._calculate_spectrum(model_components)

        # The AGN component is added after the galaxy spectrum is built.
        if self.agn:
            self.agn.update(self.model_comp["agn"])

            # NOTE: these in-place operations act on ``self.agn.spectrum``.
            agn_spec = self.agn.spectrum
            agn_spec *= self.igm.trans(self.model_comp["redshift"])

            if self.agn_dust_atten:
                agn_av = self.model_comp["agn_dust"]["Av"]
                agn_spec *= 10 ** (-agn_av * self.agn_dust_atten.A_cont / 2.5)

            zplus1 = self.model_comp["redshift"] + 1.0
            self.spectrum_full += agn_spec / zplus1

            if self.spec_wavs is not None:
                # Place the AGN spectrum on the observed wavelength grid,
                # with zero flux outside the model coverage.
                self.spectrum[:, 1] += np.interp(
                    self.spec_wavs,
                    self.wavelengths * zplus1,
                    agn_spec / zplus1,
                    left=0,
                    right=0,
                )

        if fast_spec_only:
            return

        redshift = model_components["redshift"]

        if self.filt_list is not None:
            self._calculate_photometry(redshift)

        if not self.sfh.unphysical:
            self._calculate_uvj_mags()

        # Deal with any spectral index calculations.
        if self.index_list is not None:
            self.index_names = [ind["name"] for ind in self.index_list]

            self.indices = np.zeros(len(self.index_list))
            for i, index_def in enumerate(self.index_list):
                self.indices[i] = measure_index(index_def, self.spectrum, redshift)


    def _calculate_full_spectrum(
        self,
        model_comp: dict,
        cont_only: bool = True,
        rm_line: list[str] | str | None = None,
        fast_spec_only: bool = True,
    ):
        """
        Calculate a full model spectrum given a set of model components.

        This method combines the models for the various emission
        and absorption processes to generate the internal full galaxy
        spectrum held within the class. The `_calculate_photometry` and
        `_calculate_spectrum` methods generate observables using this
        internal full spectrum.

        On return, ``self.spectrum_full`` holds the spectrum,
        ``self.line_fluxes`` maps every name in ``config.line_names`` to
        its flux, and ``self.lum_flux`` holds the luminosity-to-flux
        conversion factor. ``self.spectrum_bc`` is only set when a dust
        component is present.

        Parameters
        ----------
        model_comp : dict
            A dictionary containing information about the model to be
            generated.
        cont_only : bool, optional
            Generate only the continuum spectra, with no nebular emission
            at all. By default ``True``.
        rm_line : list[str] | str | None, optional
            The names of one or more lines to exclude from the model
            spectrum, based on the `Cloudy <https://www.nublado.org/>`__
            naming convention (see `here
            <https://bagpipes.readthedocs.io/en/latest/model_galaxies.html#getting-observables-line-fluxes>`__
            for more details). Ignored if there is no nebular component
            or if ``cont_only`` is ``True``. By default ``None``.
        fast_spec_only : bool, optional
            Passed on to the nebular SFH update, where it skips the
            calculation of derived quantities. By default ``True``.

        Raises
        ------
        ValueError
            If a name in ``rm_line`` is not in ``config.line_names``.
        """

        t_bc = 0.01
        if "t_bc" in list(model_comp):
            t_bc = model_comp["t_bc"]

        spectrum_bc, spectrum = self.stellar.spectrum(self.sfh.ceh.grid, t_bc)
        em_lines = np.zeros(config.line_wavs.shape)

        if self.nebular and not cont_only:
            grid = np.copy(self.sfh.ceh.grid)

            if "metallicity" in list(model_comp["nebular"]):
                # Use a separate metallicity for the nebular emission by
                # overriding it in a copy of every sub-component.
                nebular_metallicity = model_comp["nebular"]["metallicity"]
                neb_comp = deepcopy(model_comp)
                for comp in list(neb_comp):
                    if isinstance(neb_comp[comp], dict):
                        neb_comp[comp]["metallicity"] = nebular_metallicity

                self.neb_sfh.update(neb_comp, fast_spec_only)
                grid = self.neb_sfh.ceh.grid

            em_lines += self.nebular.line_fluxes(
                grid, t_bc, model_comp["nebular"]["logU"]
            )

            # Stellar light below 912A is converted to nebular emission
            if "fesc" in list(model_comp["nebular"]):
                f_esc = model_comp["nebular"]["fesc"]
            else:
                f_esc = 0.0

            spectrum_bc[self.wavelengths < 912.0] *= f_esc
            logU = model_comp["nebular"]["logU"]
            spectrum_bc += (1 - f_esc) * self.nebular.spectrum(grid, t_bc, logU)

            if rm_line is not None:
                velshift = model_comp["nebular"].get("velshift", 0)
                line_names = np.asarray(config.line_names)
                last_pixel = self.wavelengths.shape[0] - 1

                for rm in np.atleast_1d(rm_line).ravel():
                    matches = np.flatnonzero(line_names == rm)
                    if matches.size == 0:
                        raise ValueError(
                            f"Cannot remove unknown emission line {rm!r}: "
                            "name not found in bagpipes config.line_names."
                        )

                    for line_idx in matches:
                        line_wav_shift = config.line_wavs[line_idx] * (
                            1 + (velshift / (3 * 10**5))
                        )
                        # Each line is assumed to occupy the single model
                        # pixel nearest its (shifted) wavelength.
                        ind = np.abs(self.wavelengths - line_wav_shift).argmin()
                        if ind != 0 and ind != last_pixel:
                            width = (
                                self.wavelengths[ind + 1] - self.wavelengths[ind - 1]
                            ) / 2
                            # The nebular spectrum was added scaled by
                            # (1 - f_esc), so the same factor is needed to
                            # cancel the line exactly. ``em_lines`` itself
                            # is left unchanged.
                            spectrum_bc[ind] -= (
                                (1 - f_esc) * em_lines[line_idx] / width
                            )

        # Add attenuation due to stellar birth clouds.
        if self.dust_atten:
            dust_flux = 0.0  # Total attenuated flux for energy balance.

            # Add extra attenuation to birth clouds. With the default
            # eta = 1 there is no extra birth-cloud attenuation, so the
            # reduced Av is zero.
            eta = 1.0
            bc_Av_reduced = 0.0
            if "eta" in list(model_comp["dust"]):
                eta = model_comp["dust"]["eta"]
                bc_Av_reduced = (eta - 1.0) * model_comp["dust"]["Av"]
                if self.dust_atten.type == "VW07":
                    bc_trans_red = 10 ** (
                        -bc_Av_reduced * self.dust_atten.A_cont_bc / 2.5
                    )
                else:
                    bc_trans_red = 10 ** (-bc_Av_reduced * self.dust_atten.A_cont / 2.5)
                spectrum_bc_dust = spectrum_bc * bc_trans_red
                dust_flux += np.trapz(
                    spectrum_bc - spectrum_bc_dust, x=self.wavelengths
                )

                spectrum_bc = spectrum_bc_dust

            # Attenuate emission line fluxes.
            if self.dust_atten.type == "VW07":
                Av = model_comp["dust"]["Av"]
                # Apply birth cloud attenuation first
                em_lines *= 10 ** (-bc_Av_reduced * self.dust_atten.A_line_bc / 2.5)
                # Then apply general ISM attenuation
                em_lines *= 10 ** (-Av * self.dust_atten.A_line_ism / 2.5)

            else:
                bc_Av = eta * model_comp["dust"]["Av"]
                em_lines *= 10 ** (-bc_Av * self.dust_atten.A_line / 2.5)

        spectrum += spectrum_bc  # Add birth cloud spectrum to spectrum.

        # Add attenuation due to the diffuse ISM.
        if self.dust_atten:
            trans = 10 ** (-model_comp["dust"]["Av"] * self.dust_atten.A_cont / 2.5)
            dust_spectrum = spectrum * trans
            dust_flux += np.trapz(spectrum - dust_spectrum, x=self.wavelengths)

            spectrum = dust_spectrum
            self.spectrum_bc = spectrum_bc * trans

            # Add dust emission.
            qpah, umin, gamma = 2.0, 1.0, 0.01
            if "qpah" in list(model_comp["dust"]):
                qpah = model_comp["dust"]["qpah"]

            if "umin" in list(model_comp["dust"]):
                umin = model_comp["dust"]["umin"]

            if "gamma" in list(model_comp["dust"]):
                gamma = model_comp["dust"]["gamma"]

            spectrum += dust_flux * self.dust_emission.spectrum(qpah, umin, gamma)

        spectrum *= self.igm.trans(model_comp["redshift"])

        if "dla" in list(model_comp):
            if "redshift" in list(model_comp["dla"]):
                wavelengths_DLA_rest = (
                    self.wavelengths
                    * (1.0 + model_comp["redshift"])
                    / (1.0 + model_comp["dla"]["redshift"])
                )
            else:
                wavelengths_DLA_rest = self.wavelengths
            # NOTE(review): ``dla_trans`` is not imported in the visible
            # part of this module, so this branch looks like it would
            # raise a NameError - confirm where it should come from.
            self.dla_trans = dla_trans(
                wavelengths_DLA_rest,
                N_HI=10 ** model_comp["dla"]["logN_HI"],
                T=model_comp["dla"]["T"],
                b_turb=(
                    model_comp["dla"]["b_turb"]
                    if "b_turb" in list(model_comp["dla"])
                    else 0.0
                ),
            )
            spectrum *= self.dla_trans
            if self.dust_atten:
                self.spectrum_bc *= self.dla_trans

        if self.dust_atten:
            self.spectrum_bc *= self.igm.trans(model_comp["redshift"])

        # Convert from luminosity to observed flux at redshift z.
        self.lum_flux = 1.0
        if model_comp["redshift"] > 0.0:
            ldist_cm = (
                3.086
                * 10**24
                * np.interp(
                    model_comp["redshift"],
                    utils.z_array,
                    utils.ldist_at_z,
                    left=0,
                    right=0,
                )
            )

            self.lum_flux = 4 * np.pi * ldist_cm**2

        spectrum /= self.lum_flux * (1.0 + model_comp["redshift"])

        if self.dust_atten:
            self.spectrum_bc /= self.lum_flux * (1.0 + model_comp["redshift"])

        em_lines /= self.lum_flux

        # convert to erg/s/A/cm^2, or erg/s/A if redshift = 0.
        spectrum *= 3.826 * 10**33

        if self.dust_atten:
            self.spectrum_bc *= 3.826 * 10**33

        em_lines *= 3.826 * 10**33

        self.line_fluxes = dict(zip(config.line_names, em_lines))

        self.spectrum_full = spectrum

    def _calculate_spectrum(self, model_comp):
        """
        Generate the predicted spectrum on the ``spec_wavs`` grid.

        The full model spectrum is optionally convolved with a Gaussian
        velocity dispersion (``"veldisp"``) and with an instrumental
        resolution curve (``"R_curve"``). The redshifted wavelengths are
        then passed through `air_to_vac` before the final resampling
        onto ``self.spec_wavs``. The result is stored in
        ``self.spectrum`` as columns of wavelength and flux.

        Parameters
        ----------
        model_comp : dict
            A dictionary containing information about the model to be
            generated.
        """

        def _gaussian_kernel(sigma):
            # Normalised Gaussian kernel, with the number of pixels it
            # extends either side of its centre.
            half_width = 4 * int(sigma + 1)
            offsets = np.arange(-half_width, half_width + 1)
            gauss = np.exp(-(offsets**2) / (2 * sigma**2))
            gauss /= np.trapz(gauss)  # Explicitly normalise kernel
            return gauss, half_width

        zplusone = model_comp["redshift"] + 1.0

        if "veldisp" in model_comp:
            vres = 3 * 10**5 / config.R_spec / 2.0
            kernel, k_size = _gaussian_kernel(model_comp["veldisp"] / vres)

            # "valid" mode trims k_size pixels from each end.
            spectrum = np.convolve(self.spectrum_full, kernel, mode="valid")
            redshifted_wavs = zplusone * self.wavelengths[k_size:-k_size]

        else:
            spectrum = self.spectrum_full
            redshifted_wavs = zplusone * self.wavelengths

        if "R_curve" in model_comp:
            oversample = 4  # Number of samples per FWHM at resolution R
            new_wavs = self._get_R_curve_wav_sampling(oversample=oversample)

            spectrum = spectres.spectres(new_wavs, redshifted_wavs, spectrum, fill=0)
            redshifted_wavs = new_wavs

            # sigma width of kernel in pixels
            kernel, k_size = _gaussian_kernel(oversample / 2.35)

            # Disperse non-uniformly sampled spectrum
            spectrum = np.convolve(spectrum, kernel, mode="valid")
            redshifted_wavs = redshifted_wavs[k_size:-k_size]

        # The final resampling uses a flux-conserving interpolation
        # rather than np.interp, see
        # https://github.com/ACCarnall/bagpipes/issues/15
        vac_redshifted_wavs = self.air_to_vac(redshifted_wavs)
        fluxes = interp_conserve_c(self.spec_wavs, vac_redshifted_wavs, spectrum)

        if self.spec_units == "mujy":
            fluxes /= 10**-29 * 2.9979 * 10**18 / self.spec_wavs**2

        self.spectrum = np.c_[self.spec_wavs, fluxes]


[docs]
    @staticmethod
    def air_to_vac(wavelength: ArrayLike):
        """
        Convert air to vacuum wavelengths.

        Implements the air to vacuum wavelength conversion described in eqn 65 of
        Griesen 2006.

        TODO: check against most recent specutils conversions.

        Parameters
        ----------
        wavelength : ArrayLike
            The wavelengths in Angstroms.
        """
        # wlum = wavelength.to(u.um).value
        wlum = wavelength[wavelength >= 2e4] / 1e4
        wavelength[wavelength >= 2e4] = (
            1 + 1e-6 * (287.6155 + 1.62887 / wlum**2 + 0.01360 / wlum**4)
        ) * wavelength[wavelength >= 2e4]
        return wavelength





[docs]
class BagpipesSampler(object):
    """
    Bagpipes model galaxy sampler.

    Parameters
    ----------
    fit_instructions : dict
        A dictionary containing information about the model to be
        generated.
    veldisp : float, optional
        The velocity dispersion of the model galaxy in km/s. By default
        ``veldisp=500``.
    """

    def __init__(self, fit_instructions: dict, veldisp: float = 500.0):

        self.fit_instructions = deepcopy(fit_instructions)
        self.model_components = deepcopy(fit_instructions)
        self.model_components["veldisp"] = veldisp

        # self._set_constants()
        self._process_fit_instructions()
        self.model_gal = None
        # print (fit_instructions)

    def _process_fit_instructions(self) -> None:
        """
        Load the fit instructions and populate the class attributes.

        Originally from `bagpipes.fitting.fitted_model`.
        """
        all_keys = []  # All keys in fit_instructions and subs
        all_vals = []  # All vals in fit_instructions and subs

        self.params = []  # Parameters to be fitted
        self.limits = []  # Limits for fitted parameter values
        self.pdfs = []  # Probability densities within lims
        self.hyper_params = []  # Hyperparameters of prior distributions
        self.mirror_pars = {}  # Params which mirror a fitted param

        # Flatten the input fit_instructions dictionary.
        for key in list(self.fit_instructions):
            if not isinstance(self.fit_instructions[key], dict):
                all_keys.append(key)
                all_vals.append(self.fit_instructions[key])

            else:
                for sub_key in list(self.fit_instructions[key]):
                    all_keys.append(key + ":" + sub_key)
                    all_vals.append(self.fit_instructions[key][sub_key])

        # Sort the resulting lists alphabetically by parameter name.
        indices = np.argsort(all_keys)
        all_vals = [all_vals[i] for i in indices]
        all_keys.sort()

        # Find parameters to be fitted and extract their priors.
        for i in range(len(all_vals)):
            # R_curve cannot be fitted and is either unset or must be a 2D numpy array
            if not all_keys[i] == "R_curve":
                if isinstance(all_vals[i], tuple):
                    self.params.append(all_keys[i])
                    self.limits.append(all_vals[i])  # Limits on prior.

                    # Prior probability densities between these limits.
                    prior_key = all_keys[i] + "_prior"
                    if prior_key in list(all_keys):
                        self.pdfs.append(all_vals[all_keys.index(prior_key)])

                    else:
                        self.pdfs.append("uniform")

                    # Any hyper-parameters of these prior distributions.
                    self.hyper_params.append({})
                    for i in range(len(all_keys)):
                        if all_keys[i].startswith(prior_key + "_"):
                            hyp_key = all_keys[i][len(prior_key) + 1 :]
                            self.hyper_params[-1][hyp_key] = all_vals[i]

                # Find any parameters which mirror the value of a fit param.
                if all_vals[i] in all_keys:
                    self.mirror_pars[all_keys[i]] = all_vals[i]

                if all_vals[i] == "dirichlet":
                    n = all_vals[all_keys.index(all_keys[i][:-6])]
                    comp = all_keys[i].split(":")[0]
                    for j in range(1, n):
                        self.params.append(comp + ":dirichletr" + str(j))
                        self.pdfs.append("uniform")
                        self.limits.append((0.0, 1.0))
                        self.hyper_params.append({})

        # Find the dimensionality of the fit
        self.ndim = len(self.params)


[docs]
    def update_model_components(
        self,
        param: ArrayLike,
    ) -> dict:
        """
        Generate a model object with the current parameters.

        Originally from `bagpipes.fitting.fitted_model`, modified to allow
        for running in parallel (no attributes overwritten).

        Parameters
        ----------
        param : ArrayLike
            The array of parameters to be updated.

        Returns
        -------
        dict
            The updated components for a model galaxy.
        """

        new_components = deepcopy(self.model_components)

        dirichlet_comps = []

        # Substitute values of fit params from param into model_comp.
        for i in range(len(self.params)):
            split = self.params[i].split(":")
            if len(split) == 1:
                new_components[self.params[i]] = param[i]

            elif len(split) == 2:
                if "dirichlet" in split[1]:
                    if split[0] not in dirichlet_comps:
                        dirichlet_comps.append(split[0])

                else:
                    new_components[split[0]][split[1]] = param[i]

        # Set any mirror params to the value of the relevant fit param.
        for key in list(self.mirror_pars):
            split_par = key.split(":")
            split_val = self.mirror_pars[key].split(":")
            fit_val = new_components[split_val[0]][split_val[1]]
            new_components[split_par[0]][split_par[1]] = fit_val

        # Deal with any Dirichlet distributed parameters.
        if len(dirichlet_comps) > 0:
            comp = dirichlet_comps[0]
            n_bins = 0
            for i in range(len(self.params)):
                split = self.params[i].split(":")
                if (split[0] == comp) and ("dirichlet" in split[1]):
                    n_bins += 1

            new_components[comp]["r"] = np.zeros(n_bins)

            j = 0
            for i in range(len(self.params)):
                split = self.params[i].split(":")
                if (split[0] == comp) and "dirichlet" in split[1]:
                    new_components[comp]["r"][j] = param[i]
                    j += 1

            tx = dirichlet(new_components[comp]["r"], new_components[comp]["alpha"])

            new_components[comp]["tx"] = tx

        # new_components["veldisp"] = 1100.

        return new_components



[docs]
    def sample(
        self,
        param_vector: ArrayLike,
        cont_only: bool = False,
        rm_line: list[str] | str | None = None,
        return_line_flux: bool = False,
        **model_kwargs,
    ) -> ArrayLike:
        """
        Generate the model spectrum for a sampled parameter vector.

        The underlying model galaxy is created on the first call, and
        only updated on later calls.

        Parameters
        ----------
        param_vector : ArrayLike
            The array of parameters to be updated.
        cont_only : bool, optional
            If ``True``, the model spectrum will be generated without any
            nebular emission. By default ``False``.
        rm_line : list[str] | str | None, optional
            The names of one or more lines to exclude from the model
            spectrum, based on the `Cloudy <https://www.nublado.org/>`__
            naming convention (see `here
            <https://bagpipes.readthedocs.io/en/latest/model_galaxies.html#getting-observables-line-fluxes>`__
            for more details). By default ``None``.
        return_line_flux : bool, optional
            If ``True``, also return the total line flux for all lines
            named in ``rm_line``. By default ``False``.
        **model_kwargs : dict, optional
            Any additional keyword arguments to pass to
            `~niriss_tools.grism.specgen.ExtendedModelGalaxy`. These are
            only used when the model galaxy is first created.

        Returns
        -------
        ArrayLike
            A 2D array, containing the wavelengths and corresponding
            fluxes of the modelled galaxy spectrum. If
            ``return_line_flux`` is ``True``, a tuple of this array and
            the summed line flux (``0.0`` if ``rm_line`` is ``None``).
        """

        components = self.update_model_components(param_vector)

        if self.model_gal is None:
            self.model_gal = ExtendedModelGalaxy(components, **model_kwargs)

        self.model_gal.update(components, cont_only=cont_only, rm_line=rm_line)

        if not return_line_flux:
            return self.model_gal.spectrum.T

        # Sum the model fluxes of every requested line.
        if rm_line is None:
            names = []
        else:
            names = np.atleast_1d(rm_line).ravel()
        line_flux = sum((self.model_gal.line_fluxes[name] for name in names), 0.0)

        return self.model_gal.spectrum.T, line_flux




def _init_spec_sampler(fit_instructions, veldisp):
    """
    Create the module-level sampler used by `create_spec_file`.

    This is passed as the ``initializer`` of the worker pool in
    `pre_gen_spec`, and binds a new `BagpipesSampler` to the global name
    ``spec_sampler``.

    Parameters
    ----------
    fit_instructions : dict
        Forwarded to `BagpipesSampler` as ``fit_instructions``.
    veldisp : float
        Forwarded to `BagpipesSampler` as ``veldisp``.
    """
    global spec_sampler
    sampler_kwargs = {
        "fit_instructions": fit_instructions,
        "veldisp": veldisp,
    }
    spec_sampler = BagpipesSampler(**sampler_kwargs)


def create_spec_file(
    post_id: str,
    posterior_dir: Path | None = None,
    spec_dir: Path | None = None,
    spec_wavs: ArrayLike | None = None,
) -> None:
    """
    Generate resampled spectra from a bagpipes posterior output.

    The ``"samples2d"`` dataset is read from the posterior file, a
    spectrum is generated for every unique parameter vector using the
    module-level ``spec_sampler``, and the result is written to the
    ``"spec_data"`` dataset of the spectral file, with one row per
    posterior sample (in the original sample order). If the spectral
    file already contains ``"spec_data"``, nothing is written.

    Parameters
    ----------
    post_id : str
        The ID of the posterior ``"*.h5"`` file.
    posterior_dir : Path | None, optional
        The directory containing the posterior file. Although the default
        is ``None``, a directory must be supplied; ``None`` raises a
        `TypeError`.
    spec_dir : Path | None, optional
        The directory containing the spectral file. Although the default
        is ``None``, a directory must be supplied; ``None`` raises a
        `TypeError`.
    spec_wavs : ArrayLike | None, optional
        The wavelengths onto which the spectrum will be resampled. If
        ``None`` (default), the ``"spec_wavs"`` dataset already stored
        in the spectral file is used instead.

    Raises
    ------
    ValueError
        If ``spec_wavs`` is ``None`` and the spectral file does not
        contain a ``"spec_wavs"`` dataset.
    """

    # ``Path(None)`` raises ``TypeError``, so a missing directory fails in
    # the same way as before, whilst plain strings are now accepted.
    posterior_path = Path(posterior_dir) / f"{post_id}.h5"
    spec_path = Path(spec_dir) / f"{post_id}.h5"

    with h5py.File(posterior_path, "r") as post_file:
        samples2d = np.array(post_file["samples2d"])

    with h5py.File(spec_path, "a") as spec_file:

        # Nothing to do if the spectra were generated on a previous run.
        if "spec_data" in spec_file:
            return

        if "spec_wavs" not in spec_file:
            if spec_wavs is None:
                raise ValueError(
                    f"No wavelength grid available for '{post_id}': "
                    "'spec_wavs' was not supplied, and is not stored in "
                    "the spectral file."
                )
            spec_file.create_dataset("spec_wavs", data=spec_wavs)
        elif spec_wavs is None:
            # Fall back on the grid saved by an earlier (partial) run.
            spec_wavs = spec_file["spec_wavs"][()]

        # Posterior samples are frequently duplicated, so each unique
        # parameter vector is only evaluated once.
        unique_vectors, unique_inv = np.unique(
            samples2d, axis=0, return_inverse=True
        )
        # NumPy 2.0.0 returned a non-1D inverse when ``axis`` was given;
        # flattening keeps the fancy-indexing below two-dimensional.
        unique_inv = np.ravel(unique_inv)

        n_wavs = np.shape(spec_wavs)[0]
        spec_data = np.zeros((unique_vectors.shape[0], n_wavs))

        for s_i, param_vector in enumerate(unique_vectors):
            # The sampler output is indexed with ``[1]``; only that row
            # (the fluxes, per the sampler's docstring) is stored.
            spec_data[s_i] = spec_sampler.sample(
                param_vector,
                spec_wavs=spec_wavs,
            )[1]

        # Expand back to one spectrum per posterior sample.
        spec_file.create_dataset("spec_data", data=spec_data[unique_inv])


def pre_gen_spec(
    pipes_dir: Path,
    fit_instructions: dict,
    spec_wavs: ArrayLike,
    veldisp: float = 500,
    run: str = "",
    cpu_count: int | None = None,
) -> None:
    """
    Generate resampled spectra for all posterior samples.

    Every ``"*.h5"`` file in ``pipes_dir / "posterior" / run`` is passed
    to `create_spec_file` in a pool of worker processes, and the outputs
    are written to ``pipes_dir / "spec" / run`` (created if necessary).
    If no posterior files are found, the function returns without
    starting any processes.

    Parameters
    ----------
    pipes_dir : Path
        The main bagpipes directory.
    fit_instructions : dict
        A dictionary containing the details of the model, as well as any
        constraints and priors on the parameters.
    spec_wavs : `ArrayLike`
        An array of wavelengths at which spectral fluxes should be
        returned.
    veldisp : float, optional
        The velocity dispersion of the model galaxy in km/s. By default
        ``veldisp=500``.
    run : str, optional
        The subfolder into which outputs will be saved, useful e.g.
        for fitting more than one model configuration to the same
        data, by default ``""``.
    cpu_count : int, optional
        The number of processes to use when generating the spectra. If
        ``None`` (default), this will run on the number of
        cores returned by  `multiprocessing.cpu_count`.

    Notes
    -----
    Exceptions raised in the worker processes are printed, not
    re-raised, so a failure for one posterior file does not stop the
    remaining files from being processed.
    """

    pipes_dir = Path(pipes_dir)
    posterior_dir = pipes_dir / "posterior" / run

    spec_dir = pipes_dir / "spec" / run
    spec_dir.mkdir(exist_ok=True, parents=True)

    # Sorted so that the submission order does not depend on the
    # arbitrary ordering returned by ``glob``.
    post_ids = sorted(f.stem for f in posterior_dir.glob("*.h5"))

    if not post_ids:
        return

    # Generate the spectra
    print("Generating resampled spectra...")

    task_kwargs = dict(
        posterior_dir=posterior_dir,
        spec_dir=spec_dir,
        spec_wavs=spec_wavs,
    )

    # The context manager closes the bar even if the pool raises.
    with tqdm(total=len(post_ids)) as pbar:

        def _on_success(_result):
            pbar.update()

        def _on_error(exc):
            # Report the failure, but still count the task as finished so
            # that the bar reaches its total.
            print(exc)
            pbar.update()

        with Pool(
            processes=cpu_count,
            initializer=_init_spec_sampler,
            initargs=(
                fit_instructions,
                veldisp,
            ),
        ) as pool:
            for post_id in post_ids:
                pool.apply_async(
                    create_spec_file,
                    (post_id,),
                    kwds=task_kwargs,
                    error_callback=_on_error,
                    callback=_on_success,
                )
            # Wait for all tasks before ``Pool.__exit__`` terminates the
            # workers.
            pool.close()
            pool.join()