Source code for exoiris.exoiris

#  ExoIris: fast, flexible, and easy exoplanet transmission spectroscopy in Python.
#  Copyright (C) 2024 Hannu Parviainen
#
#  This program is free software: you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation, either version 3 of the License, or
#  (at your option) any later version.
#
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with this program.  If not, see <https://www.gnu.org/licenses/>.

import codecs
import json
import pickle
from collections.abc import Sequence
from multiprocessing import Pool
from pathlib import Path
from typing import Optional, Callable, Any, Literal

import astropy.io.fits as pf
import astropy.units as u
import matplotlib.axes
import pandas as pd
from astropy.table import Table
from celerite2 import GaussianProcess, terms
from emcee import EnsembleSampler
from matplotlib.pyplot import subplots, setp, figure, Figure, Axes
from numpy import (any, where, sqrt, clip, percentile, median, squeeze, floor, ndarray, isfinite,
                   array, inf, arange, argsort, concatenate, full, nan, r_, nanpercentile, log10,
                   ceil, unique, zeros, cov)
from numpy.typing import ArrayLike
from numpy.random import normal
from pytransit import UniformPrior, NormalPrior
from pytransit.param import ParameterSet
from pytransit.utils.de import DiffEvol
from scipy.stats import norm
from uncertainties import UFloat

from .ldtkld import LDTkLD
from .tsdata import TSData, TSDataGroup
from .tslpf import TSLPF, interpolators
from .wlpf import WhiteLPF
from .loglikelihood import LogLikelihood



[docs]
def load_model(fname: Path | str, name: str | None = None):
    """Load an ExoIris analysis from a FITS file.

    Rebuilds an ``ExoIris`` instance from the data, the primary header cards, and the
    ``K_KNOTS``, ``LD_KNOTS``, and ``PRIORS`` HDUs of the file. The ``WHITE_DATA``, ``DE``,
    and ``MCMC`` HDUs and the ephemeris, spot, and free-knot header cards are restored
    when they are present.

    Parameters
    ----------
    fname
        The name of the savefile.
    name
        The name of the new ExoIris model. If not provided, the original analysis name will be used.

    Returns
    -------
    ExoIris
        The saved ExoIris analysis.

    Raises
    ------
    IOError
        If there is an error while opening or reading the file.
    KeyError
        If a mandatory header card or HDU (such as ``LDMODEL``, ``K_KNOTS``, ``LD_KNOTS``,
        or ``PRIORS``) is missing.
    ValueError
        If the stored data do not pass the validation done by the ``ExoIris`` initializer.

    Notes
    -----
    The limb darkening setup and the priors are stored as pickled objects. Unpickling can
    execute arbitrary code, so only load files that come from a trusted source.
    """
    with pf.open(fname) as hdul:
        data = TSDataGroup.import_fits(hdul)
        hdr = hdul[0].header

        # Read the limb darkening model.
        # ==============================
        if hdr['LDMODEL'] == 'ldtk':
            # SECURITY: pickle.loads on file content; the savefile must be trusted.
            filters, teff, logg, metal, dataset = pickle.loads(codecs.decode(json.loads(hdr['LDTKLD']).encode(), "base64"))
            ldm = LDTkLD(filters, teff, logg, metal, dataset=dataset)
        else:
            ldm = hdr['LDMODEL']

        # Read the interpolation model, the limb darkening interpolation model, and the
        # noise model. Files that lack these cards fall back to the defaults given here.
        # ==============================================================================
        ip = hdr.get('INTERP', 'linear')
        ip_ld = hdr.get('INTERP_LD', 'bspline-quadratic')
        # NOTE(review): the 'white' fallback is not among the names listed in the
        # ExoIris.__init__ annotation; confirm that TSLPF still accepts it.
        noise_model = hdr.get('NOISE', 'white')

        # Setup the analysis.
        # ===================
        a = ExoIris(name or hdr['NAME'], ldmodel=ldm, data=data, noise_model=noise_model, interpolation=ip)
        a.set_limb_darkening_interpolator(ip_ld)
        a.set_radius_ratio_knots(hdul['K_KNOTS'].data.astype('d'))
        a.set_limb_darkening_knots(hdul['LD_KNOTS'].data.astype('d'))

        # Read the white light curve models if they exist.
        # ================================================
        try:
            tb = Table.read(hdul['WHITE_DATA'])
            white_ids = tb['id'].data
            uids = unique(white_ids)
            a._white_times = [tb['time'].data[white_ids == i] for i in uids]
            a._white_fluxes = [tb['flux_obs'].data[white_ids == i] for i in uids]
            a._white_errors = [tb['flux_obs_err'].data[white_ids == i] for i in uids]
            a._white_models = [tb['flux_mod'].data[white_ids == i] for i in uids]
        except KeyError:
            # Best effort: the HDU (or one of its columns) is not in the file.
            pass

        # Read the ephemeris if it exists.
        # ================================
        try:
            a.period = hdr['P']
            a.zero_epoch = hdr['T0']
            a.transit_duration = hdr['T14']
            for d in a.data:
                d.mask_transit(a.zero_epoch, a.period, a.transit_duration)
        except (KeyError, ValueError):
            # Best effort: the ephemeris is optional, the transit mask is left as it is.
            pass

        # Read the spots if they exist.
        # =============================
        if hdr.get('SPOTS') is True:
            a.initialize_spots(hdr["SP_TSTAR"], hdr["SP_REFWL"], hdr["SP_TLSE"])
            for i in range(hdr['NSPOTS']):
                a.add_spot(hdr[f'SP{i+1:02d}_EG'])

        # Read the free k knot indices if they exist.
        # ===========================================
        n_free_k = hdr.get('N_FREE_K', 0)
        if n_free_k > 0:
            a._tsa.set_free_k_knots([int(hdr[f'KK_IX_{i:03d}']) for i in range(n_free_k)])

        # Read the priors.
        # ================
        # SECURITY: pickle.loads on file content; the savefile must be trusted.
        priors = pickle.loads(codecs.decode(json.loads(hdul['PRIORS'].header['PRIORS']).encode(), "base64"))
        for praw in priors:
            p = pickle.loads(praw)
            # Priors of parameters that the rebuilt model does not have are skipped.
            if p.name in a._tsa.ps.names:
                a._tsa.set_prior(p.name, p.prior)

        # Read the optimizer population and the MCMC chains if they exist.
        # ================================================================
        if 'DE' in hdul:
            a._tsa._de_population = Table(hdul['DE'].data).to_pandas().values
            a._tsa._de_imin = hdul['DE'].header['IMIN']
        if 'MCMC' in hdul:
            npop = hdul['MCMC'].header['NPOP']
            ndim = hdul['MCMC'].header['NDIM']
            a._tsa._mc_chains = Table(hdul['MCMC'].data).to_pandas().values.reshape([npop, -1, ndim])
        return a




[docs]
class ExoIris:
    """The core ExoIris class providing tools for exoplanet transit spectroscopy.
    """


[docs]
    def __init__(self, name: str, ldmodel, data: TSDataGroup | TSData, nk: int = 50, nldc: int = 10, nthreads: int = 1,
                 tmpars: dict | None = None, noise_model: Literal["white_profiled", "white_marginalized", "fixed_gp", "free_gp"] = 'white_profiled',
                 interpolation: Literal['nearest', 'linear', 'pchip', 'makima', 'bspline', 'bspline-quadratic', 'bspline-cubic'] = 'linear'):
        """Validate the data and set up the transmission spectroscopy model.

        Parameters
        ----------
        name
            The name of the instance.
        ldmodel
            The model for the limb darkening.
        data
            The time-series data. A single ``TSData`` is wrapped into a ``TSDataGroup``.
        nk
            The number of radius ratio (k) knots.
        nldc
            The number of limb darkening knots.
        nthreads
            The number of threads to use for computation.
        tmpars
            Additional transit model parameters.
        noise_model
            The noise model to use: "white_profiled", "white_marginalized", "fixed_gp", or "free_gp".
        interpolation
            The interpolation method forwarded to the underlying model (presumably used for
            the radius ratios; confirm in ``TSLPF``).

        Raises
        ------
        ValueError
            If the unmasked fluxes or errors of a data set contain non-finite values, or if
            the noise, offset, or epoch group indices do not form the sequence 0, 1, ..., n-1.
        """
        data = TSDataGroup([data]) if isinstance(data, TSData) else data

        for d in data:
            if any(~isfinite(d.fluxes[d.mask])):
                raise ValueError(f"The {d.name} data set flux array contains unmasked non-finite values.")

            if any(~isfinite(d.errors[d.mask])):
                raise ValueError(f"The {d.name} data set error array contains unmasked non-finite values.")

        # Each group index set must start from zero and have no gaps.
        for label in ("noise", "offset", "epoch"):
            groups = array(getattr(data, f"{label}_groups"))
            if groups.min() != 0 or groups.max() + 1 != unique(groups).size:
                raise ValueError(f"The {label} groups must start from 0 and be consecutive.")

        self._tsa = TSLPF(self, name, ldmodel, data, nk=nk, nldc=nldc, nthreads=nthreads, tmpars=tmpars,
                                 noise_model=noise_model, interpolation=interpolation)
        self._wa: None | WhiteLPF = None

        self.nthreads: int = nthreads

        # Ephemeris, unknown until set from outside or by the white light curve fit.
        self.period: float | None = None
        self.zero_epoch: float | None = None
        self.transit_duration: float | None= None
        self._tref = floor(self.data.tmin)

        # White light curve arrays used while no white light curve model is attached.
        self._white_times: None | list[ndarray] = None
        self._white_fluxes: None | list[ndarray] = None
        self._white_errors: None | list[ndarray] = None
        self._white_models: None | list[ndarray] = None
        self.white_gp_models: None | list[ndarray] = None



[docs]
    def lnposterior(self, pvp: ndarray) -> ndarray:
        """Calculate the log posterior probability for a single parameter vector or an array of parameter vectors.

        Parameters
        ----------
        pvp
            The vector of parameter values or an array of parameter vectors with a shape [npv, np].

        Returns
        -------
        ndarray
            The natural logarithm of the posterior probability.
        """
        return squeeze(self._tsa.lnposterior(pvp))



[docs]
    def set_noise_model(self, noise_model: Literal['white', 'fixed_gp', 'free_gp']) -> None:
        """Set the noise model for the analysis.

        Parameters
        ----------
        noise_model
            The noise model to be used.

        Raises
        ------
        ValueError
            If noise_model is not one of the specified options.
        """
        self._tsa.set_noise_model(noise_model)



[docs]
    def set_data(self, data: TSData | TSDataGroup) -> None:
        """Replace the data of the underlying model.

        Parameters
        ----------
        data
           The spectroscopic transit light curve data. A single ``TSData`` is
           wrapped into a one-element ``TSDataGroup`` first.
        """
        if isinstance(data, TSData):
            data = TSDataGroup([data])
        self._tsa.set_data(data)



[docs]
    def set_prior(self, parameter: Literal['radius ratios', 'offsets', 'wn multipliers'] | str,
                  prior: str | Any, *nargs) -> None:
        """Set a prior on a model parameter.

        Parameters
        ----------
        parameter
            The name of the parameter to set a prior for. Can also be 'radius ratios', 'offsets', or 'wn multipliers'
            to set identical priors on all the radius ratios, offsets, or white noise multipliers.

        prior
            The prior distribution for the parameter. This can be "NP" for a normal prior, "UP" for a
            uniform prior, or an object with .logpdf(x) method.

        *nargs
            Additional arguments to be passed to the prior: (mean, std) for the normal prior and (min, max)
            for the uniform prior.
        """
        if parameter == 'radius ratios':
            for l in self._tsa.k_knots:
                self.set_prior(f'k_{l:08.5f}', prior, *nargs)
        elif parameter == 'wn multipliers':
            for par in self.ps[self._tsa._sl_wnm]:
                self.set_prior(par.name, prior, *nargs)
        elif parameter == 'offsets':
            for par in self.ps[self._tsa._sl_bias]:
                self.set_prior(par.name, prior, *nargs)
        else:
            self._tsa.set_prior(parameter, prior, *nargs)



[docs]
    def set_radius_ratio_prior(self, prior, *nargs) -> None:
        """Set an identical prior on all radius ratio (k) knots.

        Parameters
        ----------
        prior
            The prior for the radius ratios. This can be "NP" for a normal prior, "UP" for a uniform prior,
            or an object with .logpdf(x) method.
        *nargs
            Additional arguments for the prior.
        """
        for l in self._tsa.k_knots:
            self.set_prior(f'k_{l:08.5f}', prior, *nargs)



[docs]
    def set_baseline_prior(self, prior, *nargs) -> None:
        """Set an identical prior on all baseline knots.

        Parameters
        ----------
        prior
            The prior for the baseline knots.  This can be "NP" for a normal prior, "UP" for a uniform prior,
            or an object with .logpdf(x) method.
        *nargs
            Additional arguments for the prior.
        """
        for par in self.ps[self._tsa._sl_baseline]:
            self.set_prior(par.name, prior, *nargs)



[docs]
    def set_ldtk_prior(self,
                       teff: UFloat | tuple[float, float],
                       logg: UFloat | tuple[float, float],
                       metal: UFloat | tuple[float, float],
                       dataset: str = 'visir-lowres', width: float = 50.0, uncertainty_multiplier: float = 10.0):
        """Set the limb darkening priors from theoretical stellar models using LDTk.

        Each stellar parameter can be given either as a ``UFloat`` or as a
        (value, uncertainty) tuple. ``UFloat`` values are converted to tuples before
        everything is forwarded to the underlying model.

        Parameters
        ----------
        teff
            The effective temperature and its uncertainty in Kelvin.
        logg
            The surface gravity and its uncertainty (presumably log g in cgs units; TODO confirm).
        metal
            The metallicity and its uncertainty.
        dataset
            The name of the dataset. Default is 'visir-lowres'.
        width
            The passband width in nanometers. Default is 50.
        uncertainty_multiplier
            The multiplier used to widen the prior. Default is 10.
        """
        def as_pair(value):
            # A UFloat is split into (nominal value, standard deviation).
            if isinstance(value, UFloat):
                return value.n, value.s
            return value

        self._tsa.set_ldtk_prior(as_pair(teff), as_pair(logg), as_pair(metal),
                                 dataset, width, uncertainty_multiplier)



[docs]
    def set_gp_hyperparameters(self, sigma: float, rho: float, idata: None | int = None) -> None:
        """Set Gaussian Process (GP) hyperparameters assuming a Matern-3/2 kernel.

        Parameters
        ----------
        sigma
            The kernel amplitude parameter.
        rho
            The length scale parameter.
        idata
            The data set for which to set the hyperparameters. If None, the hyperparameters are set for all data sets.
        """
        self._tsa.set_gp_hyperparameters(sigma, rho, idata)



[docs]
    def set_gp_kernel(self, kernel: terms.Term) -> None:
        """Replace the Gaussian Process (GP) kernel of the underlying model.

        Parameters
        ----------
        kernel
            The celerite2 kernel term to use for the GP.
        """
        model = self._tsa
        model.set_gp_kernel(kernel)



[docs]
    def initialize_spots(self, tstar: float, wlref: float, include_tlse: bool = True):
        """Initialize star spot model using given stellar and wavelength reference values.

        Parameters
        ----------
        tstar
            Effective stellar temperature [K].
        wlref
            Reference wavelength where spot amplitude matches the amplitude parameter.
        """
        self._tsa.initialize_spots(tstar, wlref, include_tlse)



[docs]
    def add_spot(self, epoch_group: int) -> None:
        """Add a new star spot and associate it with an epoch group.

        Parameters
        ----------
        epoch_group
            Identifier for the epoch group to which the spot will be added.
        """
        self._tsa.add_spot(epoch_group)


    @property
    def nspots(self) -> int:
        """Number of star spots."""
        if self._tsa.spot_model is None:
            return 0
        else:
            return self._tsa.spot_model.nspots

    @property
    def name(self) -> str:
        """Analysis name."""
        return self._tsa.name

    @name.setter
    def name(self, name: str):
        self._tsa.name = name

    @property
    def data(self) -> TSDataGroup:
        """The data group held by the underlying model."""
        model = self._tsa
        return model.data

    @property
    def k_knots(self) -> ndarray:
        """Radius ratio (k) knots."""
        return self._tsa.k_knots

    @property
    def ndim(self) -> int:
        """Number of free model parameters."""
        return self._tsa.ndim

    @property
    def nk(self) -> int:
        """Number of radius ratio (k) knots."""
        return self._tsa.nk

    @property
    def nldp(self) -> int:
        """Number of limb darkening knots."""
        return self._tsa.nldc

    @property
    def npb(self) -> list[int]:
        """Number of passbands for each data set."""
        return self._tsa.npb

    @property
    def ldmodel(self):
        """The limb darkening model."""
        return self._tsa.ldmodel

    @property
    def sampler(self) -> EnsembleSampler |None:
        """The emcee sampler of the underlying model, or None if there is none."""
        model = self._tsa
        return model.sampler

    @property
    def optimizer(self) -> DiffEvol | None:
        """The global optimizer (``de``) of the underlying model, or None if there is none."""
        model = self._tsa
        return model.de

    @property
    def gp(self) -> list[GaussianProcess]:
        """The Gaussian Process (GP) models held by the underlying model."""
        model = self._tsa
        return model._gp

    @property
    def optimizer_population(self) -> ndarray:
        """DE optimizer parameter vector population."""
        return self._tsa._de_population

    @property
    def mcmc_chains(self) -> ndarray:
        """Emcee sampler MCMC chains."""
        return self._tsa._mc_chains

    @property
    def posterior_samples(self) -> pd.DataFrame:
        """Posterior samples from the MCMC sampler."""
        return pd.DataFrame(self._tsa._mc_chains.reshape([-1, self.ndim]), columns=self.ps.names)

    @property
    def white_times(self) -> list[ndarray]:
        """White light curve time arrays."""
        if self._wa is None:
            return self._white_times
        else:
            return self._wa.times

    @property
    def white_fluxes(self) -> list[ndarray]:
        """White light curve flux arrays."""
        if self._wa is None:
            return self._white_fluxes
        else:
            return self._wa.fluxes

    @property
    def white_models(self) -> list[ndarray]:
        """Fitted white light curve flux model arrays."""
        if self._wa is None:
            return self._white_models
        else:
            fm = self._wa.flux_model(self._wa._local_minimization.x)
            return [fm[sl] for sl in self._wa.lcslices]

    @property
    def white_errors(self) -> list[ndarray]:
        """White light curve flux error arrays."""
        if self._wa is None:
            return self._white_errors
        else:
            return self._wa.std_errors


[docs]
    def set_radius_ratio_interpolator(self, interpolator: str) -> None:
        """Set the interpolator for the radius ratio (k) model.

        Parameters
        ----------
        interpolator
            The name of the interpolator, must be a key of ``interpolators``.

        Raises
        ------
        ValueError
            If the interpolator name is not recognized.
        """
        known = interpolator in interpolators
        if not known:
            raise ValueError(f"Interpolator {interpolator} not recognized.")
        self._tsa.set_k_interpolator(interpolator)



[docs]
    def add_radius_ratio_knots(self, knot_wavelengths: Sequence) -> None:
        """Add radius ratio (k) knots.

        Parameters
        ----------
        knot_wavelengths
            List or array of knot wavelengths to be added.
        """
        self._tsa.add_k_knots(knot_wavelengths)



[docs]
    def set_radius_ratio_knots(self, knot_wavelengths: Sequence) -> None:
        """Set the radius ratio (k) knots.

        Parameters
        ----------
        knot_wavelengths
            List or array of knot wavelengths.
        """
        self._tsa.set_k_knots(knot_wavelengths)



[docs]
    def free_radius_ratio_knot_locations(self, knot_ids: list[int] | ndarray) -> None:
        """Add the wavelength locations of chosen radius ratio knots to the model as free parameters.

        Parameters
        ----------
        knot_ids
            List of radius ratio knot indices to be made free parameters.
        """
        self._tsa.free_k_knot_locations(knot_ids)



[docs]
    def create_dense_radius_ratio_block(self, wlmin: float, wlmax: float) -> None:
        """Create a block of radius ratio knots using the full data resolution.

        Creates a block of radius ratio knots using the full data resolution that replaces
        any existing radius ratio knots inside the block.

        Parameters
        ----------
        wlmin
            The minimum wavelength for the full-resolution block.
        wlmax
            The maximum wavelength for the full-resolution block.
        """
        ck = self._tsa.k_knots
        nk = concatenate(self.data.wavelengths)
        nk.sort()
        nk = nk[(nk >= wlmin) & (nk <= wlmax)]
        self.set_radius_ratio_knots(r_[ck[ck < nk[0]], nk, ck[ck > nk[-1]]])



[docs]
    def set_limb_darkening_interpolator(self, interpolator: str) -> None:
        """Set the interpolator for the limb darkening model.

        Parameters
        ----------
        interpolator
            The name of the interpolator, must be a key of ``interpolators``.

        Raises
        ------
        ValueError
            If the interpolator name is not recognized.
        """
        known = interpolator in interpolators
        if not known:
            raise ValueError(f"Interpolator {interpolator} not recognized.")
        self._tsa.set_ld_interpolator(interpolator)


    def add_limb_darkening_knots(self, knot_wavelengths: Sequence) -> None:
        """Add limb darkening knots.

        Parameters
        ----------
        knot_wavelengths
            List or array of knot wavelengths to be added.
        """
        raise NotImplementedError()
        self._tsa.add_limb_darkening_knots(knot_wavelengths)


[docs]
    def set_limb_darkening_knots(self, knot_wavelengths: Sequence) -> None:
        """Set the limb darkening knots.

        Parameters
        ----------
        knot_wavelengths
            List or array of knot wavelengths.
        """
        self._tsa.set_ld_knots(knot_wavelengths)


    @property
    def ps(self) -> ParameterSet:
        """The parameter set of the underlying model."""
        model = self._tsa
        return model.ps


[docs]
    def print_parameters(self) -> None:
        """Print the model parameterization."""
        self._tsa.print_parameters(1)



[docs]
    def plot_setup(self, figsize: tuple[float, float] | None = None,
                   ax: matplotlib.axes.Axes | None = None,
                   xscale: str | None = None, xticks: Sequence | None = None,
                   yshift: float = 0.1, mh:float = 0.08, side_margin: float = 0.05,
                   lw: float = 0.5, c='k') -> Figure:
        """Plot the data wavelengths, the limb darkening knots, and the radius ratio knots.

        Each data set gets its own row of vertical markers, followed by a row for the
        limb darkening knots and a row for the radius ratio knots.

        Parameters
        ----------
        figsize
            The figure size, used only when a new figure is created.
        ax
            The axes to draw on. A new figure is created if None.
        xscale
            The x axis scale, left untouched if None or empty.
        xticks
            The x axis tick locations, also used as the tick labels.
        yshift
            The vertical distance between the rows.
        mh
            The height of the markers.
        side_margin
            The margin added to both sides of the data wavelength range.
        lw
            The line width of the markers.
        c
            The colour of the markers.

        Returns
        -------
        Figure
            The figure the setup was drawn on.
        """
        if ax is not None:
            fig = ax.figure
        else:
            fig, ax = subplots(figsize=figsize, constrained_layout=True)

        def draw_row(positions, row):
            ax.vlines(positions, ymin=row*yshift, ymax=row*yshift+mh, colors=c, lw=lw)

        ndata = self.data.size
        for row, dataset in enumerate(self.data):
            draw_row(dataset.wavelength, row)

        # The knot rows are placed above the data rows with one empty row in between.
        draw_row(self._tsa.ld_knots, ndata + 1)
        draw_row(self.k_knots, ndata + 3)

        if xscale:
            setp(ax, xscale=xscale)
        if xticks is not None:
            ax.set_xticks(xticks, labels=xticks)

        wl_limits = (self.data.wlmin-side_margin, self.data.wlmax+side_margin)
        setp(ax, yticks=[], xlim=wl_limits, xlabel=r'Wavelength [$\mu$m]')

        tick_rows = concatenate([arange(ndata), arange(ndata+1, ndata+4, 2)])
        tick_labels = [n.replace("_", " ") for n in self.data.names] + ["Limb darkening knots", "Radius ratio knots"]
        ax.set_yticks(tick_rows*yshift+0.5*mh, labels=tick_labels)
        return fig



[docs]
    def fit_white(self, niter: int = 500) -> None:
        """Fit a white light curve model and mask the transit in the data.

        Runs a global optimization followed by a local one, stores the resulting
        period, transit centre, and transit duration, and uses them to set the
        transit mask of the data.

        Parameters
        ----------
        niter : int, optional
            The number of iterations for the global optimization algorithm (default is 500).
        """
        white = WhiteLPF(self._tsa)
        self._wa = white
        white.optimize_global(niter, plot_convergence=False, use_tqdm=False)
        white.optimize()

        # The period is the first element of the local minimization solution.
        self.period = white._local_minimization.x[0]
        self.zero_epoch = white.transit_center
        self.transit_duration = white.transit_duration
        self.data.mask_transit(self.zero_epoch, self.period, self.transit_duration)



[docs]
    def plot_white(self, axs=None, figsize: tuple[float, float] | None = None, ncols: int | None=None) -> Figure:
        """Plot the white light curve data with the best-fit model.

        The plotting is done by the white light curve model, so this requires that
        the model exists.

        Parameters
        ----------
        axs : Axes, optional
            Matplotlib axes forwarded to the white light curve model plot.
        figsize
            Tuple representing the figure size in inches.
        ncols
            Number of columns in the plot layout. If None or zero, the number of data
            sets is used, capped at two.
        """
        if not ncols:
            ncols = min(self.data.size, 2)
        return self._wa.plot(axs=axs, figsize=figsize, ncols=ncols)



[docs]
    def plot_white_gp_predictions(self, axs = None, ncol: int = 1, figsize: tuple[float, float] | None = None) -> None:
        """Plot the white light curve residuals with the Gaussian Process predictions.

        Each data set gets its own panel showing the residuals (observed minus modelled
        white light curve) and the GP prediction (in black) as a function of time.

        Parameters
        ----------
        axs
            A single Axes or a one- or two-dimensional sequence or array of Axes to draw on.
            A one-dimensional input is treated as a single row. If None, new subplots are
            generated.
        ncol
            The number of columns for the created grid of subplots. Used only if axs is None.
        figsize
            Size of the figure in inches (width, height). Used only if axs is None. If None,
            a default size is used.

        Raises
        ------
        ValueError
            If the GP predictions are not available.

        Notes
        -----
        The number of rows for the created subplots is ``ceil(ndata / ncol)``. The supplied
        axes must contain at least as many panels as there are data sets.
        """
        if self.white_gp_models is None:
            raise ValueError("White light curve GP predictions are not available. Run 'optimize_gp_hyperparameters' first.")

        ndata = self.data.size

        if axs is None:
            nrow = int(ceil(ndata / ncol))
            _, axs = subplots(nrow, ncol, sharey='all', constrained_layout=True, squeeze=False, figsize=figsize)
        else:
            # Normalise the input to a 2D object array so that the flat and column
            # indexing below work for any supported input shape.
            axs = array(axs, dtype=object)
            if axs.ndim < 2:
                axs = axs.reshape(1, -1)

        for i in range(ndata):
            tref = floor(self.white_times[i][0])
            axs.flat[i].plot(self.white_times[i] - tref, self.white_fluxes[i]-self.white_models[i])
            axs.flat[i].plot(self.white_times[i] - tref, self.white_gp_models[i], 'k')
            setp(axs.flat[i], xlabel=f'Time - {tref:.0f} [d]', xlim=self.white_times[i][[0,-1]]-tref)
        setp(axs[:, 0], ylabel='Residuals')



[docs]
    def normalize_baseline(self, deg: int = 1) -> None:
        """Normalize the baseline flux for each spectroscopic light curve.

        Normalize the baseline flux using a low-order polynomial fitted to the out-of-transit
        data for each spectroscopic light curve.

        Parameters
        ----------
        deg
            The degree of the fitted polynomial. Should be 0 or 1. Higher degrees are not allowed
            because they could affect the transit depths.

        Raises
        ------
        ValueError
            If `deg` is greater than 1.

        Notes
        -----
        This method normalizes the baseline of the fluxes for each planet. It fits a polynomial of degree
        `deg` to the out-of-transit data points and divides the fluxes by the fitted polynomial evaluated
        at each time point.
        """
        for d in self.data:
            d.normalize_to_poly(deg)



[docs]
    def plot_baseline(self, axs: Optional[Sequence[Axes]] = None, figsize=None) -> Figure:
        """Plot the spectroscopic light curves before and after the normalization.

        Each data set gets one row: the original data in the left column and the
        current data in the right column. The fluxes where the current transit mask
        is false are replaced by one.

        Parameters
        ----------
        axs
            Array of axes to plot on, indexed as ``axs[row, column]``. If None, new axes
            will be created.
        figsize
            The figure size, used only when new axes are created.

        Returns
        -------
        Figure
            The figure containing the subplots.
        """
        if axs is not None:
            fig = axs[0, 0].figure
        else:
            fig, axs = subplots(self.data.size, 2, figsize=figsize, squeeze=False, constrained_layout=True)

        for row in range(self.data.size):
            current = self.data[row]
            original = self._tsa._original_data[row]
            original.plot(ax=axs[row, 0], data=where(current.transit_mask, original.fluxes, 1))
            current.plot(ax=axs[row, 1], data=where(current.transit_mask, current.fluxes, 1))
        return fig



[docs]
    def fit(self, niter: int = 200, npop: Optional[int] = None, pool: Optional[Pool] = None, lnpost: Optional[Callable]=None,
            population: Optional[ndarray] = None, initial_population: Optional[ndarray] = None,
            min_ptp: float = 2.0, plot_convergence: bool = True) -> None:
        """Fit the spectroscopic light curves jointly using Differential Evolution.

        Fit the spectroscopic light curves jointly for `niter` iterations using Differential Evolution.

        Parameters
        ----------
        niter
            Number of iterations for optimization. Default is 200.
        npop
            Population size for optimization. Default is 150.
        pool
            Multiprocessing pool for parallel optimization. Default is None.
        lnpost
            Log posterior function for optimization. Default is None.
        """
        if population is not None:
            x0 = population
            npop = x0.shape[0]
        else:
            if self._tsa.de is None and initial_population is not None:
                x0 = initial_population
                npop = x0.shape[0]
            elif self._tsa._de_population is not None:
                x0 = self._tsa._de_population
                npop = x0.shape[0]
            else:
                if npop is None:
                    raise ValueError("'npop' cannot be None when starting global optimization from the white light curve fit.'")
                if npop <= 2*self._tsa.ndim:
                    raise ValueError("'npop' should be at least two times the number of free model parameters.")

                pv0 = self._wa._local_minimization.x
                x0 = self._tsa.ps.sample_from_prior(npop)
                x0[:, 0] = clip(normal(pv0[1], 0.05, size=npop), 0.01, inf)
                x0[:, 1] = clip(normal(pv0[0], 1e-4, size=npop), 0.01, inf)
                x0[:, 2] = clip(normal(pv0[2], 1e-3, size=npop), 0.0, 1.0)

                nep = max(self.data.epoch_groups) + 1
                for i in range(nep):
                    pida = self.ps.find_pid(f'tc_{i:02d}')
                    pidb = self._wa.ps.find_pid(f'tc_{i:02d}')
                    x0[:, pida] = normal(pv0[pidb], 0.001, size=npop)

                sl = self._tsa._sl_rratios
                x0[:, sl] = normal(sqrt(pv0[self._wa.ps.find_pid('k2')]), 0.001, size=(npop, self.nk))
                for i in range(sl.start, sl.stop):
                    x0[:, i] = clip(x0[:, i], 1.001*self.ps[i].prior.a, 0.999*self.ps[i].prior.b)

        self._tsa.optimize_global(niter=niter, npop=npop, population=x0, pool=pool, lnpost=lnpost,
                                  vectorize=(pool is None), min_ptp=min_ptp, plot_convergence=plot_convergence)
        self.de = self._tsa.de



[docs]
    def sample(self, niter: int = 500, thin: int = 10, repeats: int = 1, pool=None, lnpost=None, leave=True, save=False, use_tqdm: bool = True):
        """Draw posterior samples with the emcee MCMC sampler.

        All the arguments are forwarded to the ``sample_mcmc`` method of the underlying
        transmission spectroscopy model. The log posterior evaluation is vectorized
        whenever no parallel processing pool is given.

        Parameters
        ----------
        niter
            Number of MCMC iterations. Default is 500.
        thin
            Thinning factor applied to the MCMC samples. Default is 10.
        repeats
            Number of times the sampling run is repeated. Default is 1.
        pool
            Parallel processing pool used to parallelize the sampling. Default is None.
        lnpost
            Log posterior function mapping a parameter vector to a log posterior probability.
            Default is None.
        leave
            Whether the progress bar stays visible after the sampling finishes. Default is True.
        save
            Whether the MCMC samples are saved to disk. Default is False.
        use_tqdm
            Whether a tqdm progress bar is shown while sampling. Default is True.

        """
        mcmc_options = dict(niter=niter, thin=thin, repeats=repeats, pool=pool, lnpost=lnpost,
                            leave=leave, save=save, use_tqdm=use_tqdm)
        # Without a pool the sampler evaluates the whole population in one vectorized call.
        mcmc_options['vectorize'] = pool is None
        self._tsa.sample_mcmc(**mcmc_options)



[docs]
    def reset(self, optimizer: bool = True, sampler: bool = True) -> None:
        """Clear the stored optimizer and/or sampler state.

        Parameters
        ----------
        optimizer
            If True, the optimizer, its population, and the index of the best population
            member are set to None.
        sampler
            If True, the sampler and the stored MCMC chains are set to None.

        Returns
        -------
        None
        """
        stale = ()
        if optimizer:
            stale += ('de', '_de_population', '_de_imin')
        if sampler:
            stale += ('sampler', '_mc_chains')

        for attribute in stale:
            setattr(self._tsa, attribute, None)



[docs]
    def reset_sampler(self) -> None:
        """Discard the MCMC sampler state.

        Sets both the stored MCMC chains and the sampler of the underlying
        transmission spectroscopy model to None.
        """
        for attribute in ('_mc_chains', 'sampler'):
            setattr(self._tsa, attribute, None)



[docs]
    def plot_transmission_spectrum(self, result: Optional[str] = None, ax: Optional[Axes] = None, xscale: Optional[str] = None,
                                   xticks=None, ylim=None,  plot_resolution: bool = True) -> Figure:
        """Plot the transmission spectrum.

        The spectrum is drawn as transit depth in percent as a function of wavelength. For the
        'fit' result the best-fit spectrum is drawn as a line, and for the 'mcmc' result the
        posterior median is drawn as a line with the 16th-84th percentile range shaded. The
        radius ratio knots are marked with dots in both cases.

        Parameters
        ----------
        result
            The type of result to plot. Can be 'fit', 'mcmc', or None. If None, the default behavior is to use 'mcmc' if
            the MCMC sampler has been run, otherwise 'fit'. Default is None.
        ax
            The matplotlib Axes object to plot on. If None, a new figure and axes will be created. Default is None.
        xscale
            The scale of the x-axis. Can be 'linear', 'log', 'symlog', 'logit', or None. If None, the default behavior is to
            use the scale of the current axes. Default is None.
        xticks
            The tick locations for the x-axis. If None, the default behavior is to use the tick locations of the current axes.
        ylim
            The limits for the y-axis. If None, the default behavior is to use the limits of the current axes.
        plot_resolution
            Whether to plot the resolution of the transmission spectrum as vertical lines. Default is True.

        Returns
        -------
        Figure
            The matplotlib Figure of the plotted transmission spectrum.

        Raises
        ------
        ValueError
            If result is not 'fit', 'mcmc', or None.
        ValueError
            If result is 'mcmc' and the MCMC sampler has not been run.
        ValueError
            If result is 'fit' and the optimizer has not been run.

        """
        if result is None:
            result = 'mcmc' if self._tsa.sampler is not None else 'fit'
        if result not in ('fit', 'mcmc'):
            raise ValueError("Result must be either 'fit', 'mcmc', or None")
        if result == 'mcmc' and self._tsa._mc_chains is None:
            raise ValueError("Cannot plot posterior solution before running the MCMC sampler.")
        # Fail with a clear message instead of a TypeError from indexing a missing population.
        if result == 'fit' and self._tsa._de_population is None:
            raise ValueError("Cannot plot the best-fit solution before running the optimizer.")

        # The axes are created only after validation so that a bad call leaves no empty figure behind.
        if ax is None:
            _, ax = subplots()

        wavelength = concatenate(self.data.wavelengths)
        ix = argsort(wavelength)

        if result == 'fit':
            pv = self._tsa._de_population[self._tsa._de_imin]
            ks = self._tsa._eval_k(pv)
            ar = 1e2 * concatenate([squeeze(k) for k in ks]) ** 2
            ax.plot(wavelength[ix], ar[ix], c='k')
            ax.plot(self._tsa.k_knots, 1e2 * pv[self._tsa._sl_rratios] ** 2, 'k.')
        else:
            df = pd.DataFrame(self._tsa._mc_chains.reshape([-1, self._tsa.ndim]), columns=self._tsa.ps.names)
            ks = self._tsa._eval_k(df.values)
            ar = 1e2 * concatenate(ks, axis=1) ** 2
            ax.fill_between(wavelength[ix], *percentile(ar[:, ix], [16, 84], axis=0), alpha=0.25)
            ax.plot(wavelength[ix], median(ar, 0)[ix], c='k')
            ax.plot(self.k_knots, 1e2*median(df.iloc[:, self._tsa._sl_rratios].values, 0)**2, 'k.')
        setp(ax, ylabel='Transit depth [%]', xlabel=r'Wavelength [$\mu$m]', xlim=(self.data.wlmin, self.data.wlmax), ylim=ylim)

        if plot_resolution:
            # Short ticks along the bottom edge mark the wavelength of every spectral bin.
            yl = ax.get_ylim()
            ax.vlines(wavelength, yl[0], yl[0]+0.02*(yl[1]-yl[0]), ec='k')
        if xscale is not None:
            ax.set_xscale(xscale)
        if xticks is not None:
            ax.set_xticks(xticks, labels=xticks)
        return ax.get_figure()



[docs]
    def plot_limb_darkening_parameters(
        self,
        result: None | Literal["fit", "mcmc"] = None,
        axs: None | tuple[Axes, Axes] = None,
    ) -> None | Figure:
        """Plot the limb darkening parameters.

        Parameters
        ----------
        result
            The type of result to plot. Can be 'fit', 'mcmc', or None. If None, the default behavior is to use 'mcmc' if
            the MCMC sampler has been run, otherwise 'fit'. Default is None.
        axs
            The axes to plot the limb darkening parameters on. If None, a new figure with subplots will be created.
            Default is None.

        Returns
        -------
        Figure or None
            The figure containing the plot of the limb darkening parameters, or None if the
            limb darkening model is not one of the supported two-parameter models (nothing is
            plotted in that case).

        Raises
        ------
        ValueError
            If the result is not 'fit', 'mcmc', or None.
            If the result is 'mcmc' and the MCMC sampler has not been run.
            If the result is 'fit' and the optimizer has not been run.

        Notes
        -----
        This method plots the limb darkening parameters for two-parameter limb darkening models. It supports only
        quadratic, quadratic-tri, power-2, and power-2-pm models.
        """
        if self._tsa.ldmodel not in (
            "quadratic",
            "quadratic-tri",
            "power-2",
            "power-2-pm",
        ):
            return None

        # Validate the request before touching matplotlib so that a bad call does not
        # leave an empty figure behind.
        if result is None:
            result = "mcmc" if self._tsa.sampler is not None else "fit"
        if result not in ("fit", "mcmc"):
            raise ValueError("Result must be either 'fit', 'mcmc', or None")
        if result == "mcmc" and self._tsa.sampler is None and self.mcmc_chains is None:
            raise ValueError(
                "Cannot plot posterior solution before running the MCMC sampler."
            )
        if result == "fit" and self._tsa._de_population is None:
            raise ValueError(
                "Cannot plot the best-fit solution before running the optimizer."
            )

        if axs is None:
            fig, axs = subplots(1, 2, sharey="all", figsize=(13, 4))
        else:
            fig = axs[0].get_figure()

        wavelength = concatenate(self.data.wavelengths)
        ix = argsort(wavelength)

        if result == "fit":
            pv = self._tsa._de_population[self._tsa._de_imin]
            ldc = squeeze(concatenate(self._tsa._eval_ldc(pv), axis=1))
            # The two coefficients of each knot are interleaved in the parameter vector.
            axs[0].plot(self._tsa.ld_knots, pv[self._tsa._sl_ld][0::2], "ok")
            axs[0].plot(wavelength[ix], ldc[:, 0][ix])
            axs[1].plot(self._tsa.ld_knots, pv[self._tsa._sl_ld][1::2], "ok")
            axs[1].plot(wavelength[ix], ldc[:, 1][ix])
        else:
            if self._tsa.sampler is not None:
                pvp = self._tsa._mc_chains.reshape([-1, self._tsa.ndim])
            else:
                pvp = self.mcmc_chains.reshape([-1, self._tsa.ndim])
            ldc = pvp[:, self._tsa._sl_ld]

            # Posterior median and standard deviation of the knot values.
            ld1m = median(ldc[:, ::2], 0)
            ld1e = ldc[:, ::2].std(0)
            ld2m = median(ldc[:, 1::2], 0)
            ld2e = ldc[:, 1::2].std(0)

            # Posterior median and the 16th and 84th percentiles of the evaluated coefficients.
            ldc = concatenate(self._tsa._eval_ldc(pvp), axis=1)
            ld1p = percentile(ldc[:, :, 0], [50, 16, 84], axis=0)
            ld2p = percentile(ldc[:, :, 1], [50, 16, 84], axis=0)

            axs[0].fill_between(wavelength[ix], ld1p[1, ix], ld1p[2, ix], alpha=0.5)
            axs[0].plot(wavelength[ix], ld1p[0][ix], "k")
            axs[1].fill_between(wavelength[ix], ld2p[1, ix], ld2p[2, ix], alpha=0.5)
            axs[1].plot(wavelength[ix], ld2p[0][ix], "k")

            axs[0].errorbar(self._tsa.ld_knots, ld1m, ld1e, fmt="ok")
            axs[1].errorbar(self._tsa.ld_knots, ld2m, ld2e, fmt="ok")

        # Prior ranges indexed as [knot, coefficient, lower/upper]: the limits of a uniform
        # prior or mean -/+ std of a normal prior. Other prior types are left as NaN.
        ld_parameters = self.ps[self._tsa._sl_ld]
        ldp = full((self.nldp, 2, 2), nan)
        for i in range(self.nldp):
            for j in range(2):
                p = ld_parameters[i * 2 + j].prior
                if isinstance(p, UniformPrior):
                    ldp[i, j, 0] = p.a
                    ldp[i, j, 1] = p.b
                elif isinstance(p, NormalPrior):
                    ldp[i, j, 0] = p.mean - p.std
                    ldp[i, j, 1] = p.mean + p.std

        for i in range(2):
            for j in range(2):
                axs[i].plot(self._tsa.ld_knots, ldp[:, i, j], ":", c="C0")

        setp(
            axs,
            xlim=(wavelength.min(), wavelength.max()),
            xlabel=r"Wavelength [$\mu$m]",
        )
        setp(axs[0], ylabel="Limb darkening coefficient 1")
        setp(axs[1], ylabel="Limb darkening coefficient 2")
        return fig



[docs]
    def plot_residuals(self, result: Optional[str] = None, ax: None | Axes | Sequence[Axes] = None,
                       pmin: float = 1, pmax: float = 99,
                       show_names: bool = False, cmap = None) -> Figure:
        """Plot the model residuals.

        The residuals are calculated against the flux model evaluated for the best-fit
        parameter vector ('fit') or the posterior median parameter vector ('mcmc').

        Parameters
        ----------
        result
            The result type to plot. Must be either 'fit', 'mcmc', or None. If None, 'mcmc' is
            used if MCMC chains exist, otherwise 'fit'.
        ax
            The axes object (or a sequence of them, one per data set) to plot on. If None, a new
            figure and axes will be created.
        pmin
            The lower percentile to use when setting the color scale of the residuals image.
        pmax
            The upper percentile to use when setting the color scale of the residuals image.
        show_names
            If False, the title of each residual plot is cleared. Default is False.
        cmap
            Color map forwarded to the plot method of each data set. Default is None.

        Returns
        -------
        Figure
            The figure object containing the plotted residuals.

        Raises
        ------
        ValueError
            If result is not one of 'fit', 'mcmc', or None.
        ValueError
            If result is 'mcmc' but the MCMC sampler has not been run.
        ValueError
            If result is 'fit' but the optimizer has not been run.
        ValueError
            If result is None and neither the optimizer nor the MCMC sampler has been run.
        ValueError
            If the number of given axes does not match the number of data sets.

        """
        if result not in ('fit', 'mcmc', None):
            raise ValueError("Result must be either 'fit', 'mcmc', or None")

        if result is None:
            if self._tsa._mc_chains is not None:
                result = 'mcmc'
            elif self._tsa._de_population is not None:
                result = 'fit'
            else:
                raise ValueError("Cannot plot residuals before running either the optimizer or the MCMC sampler.")
        elif result == 'mcmc' and self._tsa._mc_chains is None:
            raise ValueError("Cannot plot posterior solution before running the MCMC sampler.")
        elif result == 'fit' and self._tsa._de_population is None:
            raise ValueError("Cannot plot the best-fit solution before running the optimizer.")

        nrows = 1 if isinstance(self.data, TSData) else self.data.size

        if ax is None:
            fig, axs = subplots(nrows, 1, squeeze=False)
            axs = axs[:, 0]
        else:
            axs = [ax] if isinstance(ax, Axes) else ax
            # Compare against the same row count that is used when the axes are created here.
            if len(axs) != nrows:
                raise ValueError("The number of axes must match the number of groups in the data.")
            fig = axs[0].figure

        if result == 'fit':
            pv = self._tsa._de_population[self._tsa._de_imin]
        else:
            pv = median(self._tsa._mc_chains.reshape([-1, self._tsa.ndim]), 0)

        fmodel = self._tsa.flux_model(pv)
        for ids, data in enumerate(self.data):
            ax = axs[ids]
            residuals = data.fluxes - squeeze(fmodel[ids])
            # Percentile-based colour limits keep outliers from dominating the colour scale.
            pp = nanpercentile(residuals, [pmin, pmax])
            data.plot(ax=ax, data=residuals, vmin=pp[0], vmax=pp[1], cmap=cmap)

            if not show_names:
                ax.set_title("")

        # Only apply tight_layout when the axes belong to a top-level Figure.
        if isinstance(fig, Figure):
            fig.tight_layout()
        return fig



[docs]
    def plot_fit(self, result: Optional[str] = None, figsize: Optional[tuple[float, float]]=None,
                 height_ratios=None,
                 res_args=None, trs_args=None) -> Figure:
        """Plot a summary figure of the best-fit or posterior model.

        The figure has the transmission spectrum on top, and the residuals (one panel per
        data set) and the two limb darkening coefficients side by side below it.

        Parameters
        ----------
        result
            Should be "fit", "mcmc", or None. Default is None.
        figsize
            The size of the figure in inches. Default is None.
        height_ratios
            Relative heights of the upper (transmission spectrum) and lower (residuals and
            limb darkening) parts of the figure. Default is None.
        res_args
            Additional keyword arguments for `plot_residuals`. Default is None.
        trs_args
            Additional keyword arguments for `plot_transmission_spectrum`. Default is None.

        Returns
        -------
        fig : matplotlib.figure.Figure
            The figure containing the transmission spectrum, residual, and limb darkening plots.
        """
        trs_kwargs = {} if trs_args is None else trs_args
        res_kwargs = {} if res_args is None else res_args

        fig = figure(layout='constrained', figsize=figsize)
        fig_spectrum, fig_lower = fig.subfigures(2, 1, hspace=0.07, height_ratios=height_ratios)
        fig_residuals, fig_ld = fig_lower.subfigures(1, 2, wspace=0.05, width_ratios=(0.5, 0.5))

        ax_spectrum = fig_spectrum.add_subplot()
        n_groups = self.data.size
        axs_residuals = [fig_residuals.add_subplot(n_groups, 1, row) for row in range(1, n_groups + 1)]
        axs_ld = tuple(fig_ld.add_subplot(2, 1, row) for row in (1, 2))

        self.plot_transmission_spectrum(result=result, ax=ax_spectrum, **trs_kwargs)
        self.plot_residuals(result=result, ax=axs_residuals, **res_kwargs)
        self.plot_limb_darkening_parameters(result=result, axs=axs_ld)

        for subfigure, title in ((fig_spectrum, 'Transmission spectrum'),
                                 (fig_residuals, 'Residuals'),
                                 (fig_ld, 'Limb darkening')):
            subfigure.suptitle(title)

        # Only the bottom panel of each column keeps its x tick labels.
        setp(axs_ld[0].get_xticklabels(), visible=False)
        for ax_residuals in axs_residuals[:-1]:
            setp(ax_residuals.get_xticklabels(), visible=False)

        setp(axs_ld[0], xlabel="", ylabel='LDC 1', ylim=(0.18, 1.02))
        setp(axs_ld[1], ylabel='LDC 2', ylim=(0.18, 1.02))
        fig.align_labels()
        return fig


    @property
    def transmission_spectrum_table(self) -> Table:
        """The posterior transmission spectrum as an Astropy Table.

        The table is sorted by wavelength and contains the posterior median and standard
        deviation of both the radius ratio and the area ratio (the radius ratio squared).

        Raises
        ------
        ValueError
            If the MCMC sampler has not been run before calculating the transmission spectrum.
        """
        if self._tsa._mc_chains is None:
            raise ValueError("Cannot calculate posterior transmission spectrum before running the MCMC sampler.")

        samples = self.posterior_samples
        wavelength = concatenate(self.data.wavelengths)
        radius_ratio = concatenate(self._tsa._eval_k(samples.values), axis=1)
        area_ratio = radius_ratio**2
        order = argsort(wavelength)

        columns = {
            'wavelength': wavelength[order]*u.micrometer,
            'radius_ratio': median(radius_ratio, 0)[order],
            'radius_ratio_e': radius_ratio.std(0)[order],
            'area_ratio': median(area_ratio, 0)[order],
            'area_ratio_e': area_ratio.std(0)[order],
        }
        return Table(data=list(columns.values()), names=list(columns))


[docs]
    def transmission_spectrum_samples(self, wavelengths: ndarray | None = None,
                                      kind: Literal['radius_ratio', 'depth'] = 'depth',
                                      samples: ndarray | None = None) -> tuple[ndarray, ndarray]:
        """Calculate posterior transmission spectrum samples.

        This method computes the posterior samples of the transmission spectrum,
        either as radius ratios or as transit depths, depending on the specified
        kind. It interpolates the data for given wavelengths or uses the
        instrumental wavelength grid if none is provided. Requires that MCMC
        sampling has been performed prior to calling this method.

        Parameters
        ----------
        wavelengths
            The array of wavelengths at which the spectrum should be sampled.
            If None, the default wavelength grid defined by the instrumental data
            will be used.
        kind
            Specifies the desired representation of the transmission spectrum.
            'radius_ratio' returns the spectrum in radius ratio units, while
            'depth' returns the spectrum in transit depth units. Default is 'depth'.
        samples
            Array of posterior samples to use for calculation. If None,
            the method will use previously stored posterior samples.

        Returns
        -------
        ndarray
            Array containing the transmission spectrum samples for the specified
            wavelengths. The representation (radius ratio or depth) depends on the
            specified `kind`.
        """
        if self.mcmc_chains is None and samples is None:
            raise ValueError("Cannot calculate posterior transmission spectrum before running the MCMC sampler.")

        if kind not in ('radius_ratio', 'depth'):
            raise ValueError("Invalid value for `kind`. Must be either 'radius_ratio' or 'depth'.")

        if samples is None:
            samples = self.posterior_samples.values

        if wavelengths is None:
            wavelengths = concatenate(self.data.wavelengths)
            wavelengths.sort()

        k_posteriors = zeros((samples.shape[0], wavelengths.size))
        k_knots = self._tsa.k_knots.copy()
        for i, pv in enumerate(samples):
            if self._tsa.free_k_knot_ids is not None:
                k_knots[self._tsa.free_k_knot_ids] = pv[self._tsa._sl_kloc]
            k_posteriors[i, :] = self._tsa._ip(wavelengths, k_knots, pv[self._tsa._sl_rratios])

        if kind == 'radius_ratio':
            return wavelengths, k_posteriors
        else:
            return wavelengths, k_posteriors**2



[docs]
    def transmission_spectrum(self, wavelengths: ndarray | None = None, kind: Literal['radius_ratio', 'depth'] = 'depth', samples: ndarray | None = None, return_cov: bool = True) -> tuple[ndarray, ndarray]:
        """Compute the transmission spectrum.

        This method calculates the mean transmission spectrum values and the covariance matrix
        (or standard deviations) for the given parameter set. The mean represents the average
        transmission spectrum, and the covariance provides information on the uncertainties and
        correlations between wavelengths or samples.

        Parameters
        ----------
        wavelengths
            Array of wavelength values at which to calculate the transmission spectrum.
            If None, the default grid will be used.
        kind
            Specifies the method to represent the spectrum. 'radius_ratio' computes the
            spectrum in terms of the planet-to-star radius ratio, while 'depth' computes
            the spectrum in terms of transit depth.
        samples
            Array of samples used to compute the spectrum uncertainties. If None, previously
            stored samples will be utilized.

        return_cov : bool, optional
            Indicates whether to return the covariance matrix of the computed transmission
            spectrum. If True, the covariance matrix is returned along with the mean spectrum.
            If False, the standard deviation of the spectrum is returned.

        Returns
        -------
        tuple[ndarray, ndarray]
            A tuple containing two arrays:
            - The mean transmission spectrum.
            - The covariance matrix of the spectrum (if `return_cov` is True), or the
              standard deviation (if `return_cov` is False).
        """
        sp_samples = self.transmission_spectrum_samples(wavelengths, kind, samples)[1]
        mean = sp_samples.mean(0)
        if return_cov:
            return mean, cov(sp_samples, rowvar=False)
        else:
            return mean, sp_samples.std(0)



[docs]
    def save(self, overwrite: bool = False) -> None:
        """Save the ExoIris analysis to a FITS file.

        The analysis is written to ``<name>.fits``, where ``<name>`` is the name of the
        analysis. The file stores the basic setup in the primary header, the radius ratio and
        limb darkening knots, the pickled priors, the data, and, when available, the white
        light curve analysis, the global optimization population, and the MCMC samples.

        Parameters
        ----------
        overwrite
            Flag indicating whether to overwrite an existing file with the same name.

        Raises
        ------
        OSError
            If the file already exists and `overwrite` is False.
        """
        pri = pf.PrimaryHDU()
        pri.header['name'] = self.name
        pri.header['p'] = self.period
        pri.header['t0'] = self.zero_epoch
        pri.header['t14'] = self.transit_duration
        pri.header['ndgroups'] = self.data.size
        pri.header['interp'] = self._tsa.interpolation
        pri.header['interp_ld'] = self._tsa.ld_interpolation
        pri.header['noise'] = self._tsa.noise_model

        if self._tsa.free_k_knot_ids is None:
            pri.header['n_free_k'] = 0
        else:
            pri.header['n_free_k'] = len(self._tsa.free_k_knot_ids)
            for i, ix in enumerate(self._tsa.free_k_knot_ids):
                pri.header[f'kk_ix_{i:03d}'] = ix

        # Priors
        # ======
        # The parameters are pickled and stored as a base64-encoded JSON string in the header.
        pr = pf.ImageHDU(name='priors')
        priors = [pickle.dumps(p) for p in self.ps]
        pr.header['priors'] = json.dumps(codecs.encode(pickle.dumps(priors), "base64").decode())

        # Limb darkening
        # ==============
        if isinstance(self._tsa.ldmodel, LDTkLD):
            ldm = self._tsa.ldmodel
            pri.header['ldmodel'] = 'ldtk'
            pri.header['ldtkld'] = json.dumps(codecs.encode(pickle.dumps((ldm.sc.filters, ldm.sc.teff, ldm.sc.logg,
                                                                          ldm.sc.metal, ldm.dataset)), "base64").decode())
        else:
            pri.header['ldmodel'] = self._tsa.ldmodel

        # Knots
        # =====
        k_knots = pf.ImageHDU(self._tsa.k_knots, name='k_knots')
        ld_knots = pf.ImageHDU(self._tsa.ld_knots, name='ld_knots')
        hdul = pf.HDUList([pri, k_knots, ld_knots, pr])
        hdul += self.data.export_fits()

        # White light curve analysis
        # ==========================
        if self._wa is not None and self._wa._local_minimization is not None:
            wa_data = pf.BinTableHDU(
                Table(
                    [
                        self._wa.lcids,
                        self._wa.timea,
                        concatenate(self.white_models),
                        self._wa.ofluxa,
                        concatenate(self._wa.std_errors),
                    ],
                    names="id time flux_mod flux_obs flux_obs_err".split(),
                ), name='white_data'
            )
            hdul.append(wa_data)

            # Table column names must be unique, so repeated parameter names get a running suffix.
            names = []
            counts = {}
            for p in self._wa.ps.names:
                if p in counts:
                    counts[p] += 1
                    names.append(f'{p}_{counts[p]}')
                else:
                    counts[p] = 0
                    names.append(p)

            wa_params = pf.BinTableHDU(Table(self._wa._local_minimization.x, names=names), name='white_params')
            hdul.append(wa_params)

        # Spots
        # =====
        if self._tsa.spot_model is not None:
            pri.header['spots'] = True
            pri.header["sp_tstar"] = self._tsa.spot_model.tphot
            pri.header["sp_refwl"] = self._tsa.spot_model.wlref
            pri.header["sp_tlse"] = self._tsa.spot_model.include_tlse
            pri.header["nspots"] = self.nspots
            for i in range(self.nspots):
                pri.header[f"sp{i+1:02d}_eg"] = self._tsa.spot_model.spot_epoch_groups[i]

        # Global optimization results
        # ===========================
        if self._tsa.de is not None:
            de = pf.BinTableHDU(Table(self._tsa._de_population, names=self.ps.names), name='DE')
            de.header['npop'] = self._tsa.de.n_pop
            de.header['ndim'] = self._tsa.de.n_par
            de.header['imin'] = self._tsa.de.minimum_index
            hdul.append(de)

        # MCMC results
        # ============
        if self._tsa.sampler is not None:
            mc = pf.BinTableHDU(Table(self._tsa.sampler.flatchain, names=self.ps.names), name='MCMC')
            mc.header['npop'] = self._tsa.sampler.nwalkers
            mc.header['ndim'] = self._tsa.sampler.ndim
            hdul.append(mc)

        # Honour the caller's choice instead of always replacing an existing file.
        hdul.writeto(f"{self.name}.fits", overwrite=overwrite)



[docs]
    def create_loglikelihood_function(self, wavelengths: ndarray, kind: Literal['radius_ratio', 'depth'] = 'depth',
                                      method: Literal['svd', 'randomized_svd', 'eigh'] = 'svd',
                                      n_max_samples: int = 10000) -> LogLikelihood:
        """Build a reduced-rank Gaussian log-likelihood function for retrieval.

        The log-likelihood is created from the posterior transmission spectrum samples
        evaluated at the given wavelengths.

        Parameters
        ----------
        wavelengths
            The wavelength grid used in the theoretical transmission spectra.
        kind
            The transmission spectrum type. Can be either 'radius_ratio' or 'depth'.
        method
            Forwarded to `LogLikelihood` as its `method` argument. Default is 'svd'.
        n_max_samples
            Forwarded to `LogLikelihood` as its `n_max_samples` argument. Default is 10000.

        Returns
        -------
        LogLikelihood
            A LogLikelihood instance built from the posterior transmission spectrum
            samples for the given wavelengths and spectrum type.

        Raises
        ------
        ValueError
            If the MCMC sampler has not been run.
        """
        if self.mcmc_chains is None:
            raise ValueError("Cannot create log-likelihood function before running the MCMC sampler.")

        spectrum_samples = self.transmission_spectrum_samples(wavelengths, kind)[1]
        return LogLikelihood(wavelengths, spectrum_samples,
                             method=method, n_max_samples=n_max_samples, nk=self.nk)



[docs]
    def create_initial_population(self, n: int, source: str, add_noise: bool = True) -> ndarray:
        """Create a starting population of parameter vectors for the DE optimisation.

        The work is delegated to the underlying transmission spectroscopy model.

        Parameters
        ----------
        n
            Number of parameter vectors in the population.
        source
            Source of the initial population. Must be either 'fit' or 'mcmc'.
        add_noise
            Flag indicating whether to add noise to the initial population. Default is True.

        Returns
        -------
        ndarray
            The initial population.

        Raises
        ------
        ValueError
            If the source is not 'fit' or 'mcmc'.
        """
        population = self._tsa.create_initial_population(n, source, add_noise)
        return population



[docs]
    def optimize_gp_hyperparameters(self,
                                    log10_sigma_bounds: float | tuple[float, float] | None = None,
                                    log10_rho_bounds: float | tuple[float, float] | None = (-5, 0),
                                    log10_sigma_prior=None, log10_rho_prior=None,
                                    npop: int = 10, niter: int = 100):
        """Optimize the GP hyperparameters using the white light curve residuals.

        A Matern-3/2 Gaussian process is fitted separately to the residuals of each white
        light curve (observed minus modelled flux) with a differential evolution optimizer.
        The optimized hyperparameters are passed to the transmission spectroscopy model, and
        the GP predictions for the residuals are stored in `white_gp_models`.

        Parameters
        ----------
        log10_sigma_bounds
            Bounds for log10 sigma. Either a (min, max) pair, a single value x that is expanded
            to (x - 1, x + 1) and used as the starting value, or None to centre the bounds on
            the log10 of the residual standard deviation (+- 1).
        log10_rho_bounds
            Bounds for log10 rho. Either a (min, max) pair, a single value x that is expanded
            to (x - 1, x + 1) and used as the starting value, or None for (-5, -2).
        log10_sigma_prior
            Prior on log10 sigma. Either a sequence of arguments for a normal distribution
            (`scipy.stats.norm`), an object with a `logpdf` method, or None for a normal prior
            centred on the log10 of the residual standard deviation with a width of 0.1.
        log10_rho_prior
            Prior on log10 rho. Either a sequence of arguments for a normal distribution
            (`scipy.stats.norm`), an object with a `logpdf` method, or None for N(-2, 1).
        npop
            Size of the differential evolution population. Default is 10.
        niter
            Number of differential evolution iterations. Default is 100.

        Returns
        -------
        list
            One array of (sigma, rho) in linear units for each white light curve.

        Raises
        ------
        ValueError
            If the noise model is not 'fixed_gp' or 'free_gp'.
        ValueError
            If a prior or a bound specification is of an unsupported type.
        """
        if self._tsa.noise_model not in ('fixed_gp', 'free_gp'):
            raise ValueError("The noise model must be set to 'fixed_gp' or 'free_gp' before the hyperparameter optimization.")

        def is_scalar(value) -> bool:
            # Integers are accepted alongside floats so that, e.g., -3 works like -3.0.
            return isinstance(value, (int, float))

        def as_prior(prior, name):
            """Convert a prior specification into an object with a `logpdf` method."""
            if isinstance(prior, Sequence):
                return norm(*prior)
            if hasattr(prior, 'logpdf'):
                return prior
            raise ValueError(f'Bad {name}')

        def as_bounds(spec, default, name):
            """Convert a bound specification into a (min, max) pair."""
            if spec is None:
                return default
            if is_scalar(spec):
                return [spec - 1, spec + 1]
            if isinstance(spec, (Sequence, ndarray)):
                if len(spec) != 2:
                    raise ValueError(f"'{name}' must contain exactly two values.")
                return spec
            raise ValueError(f"'{name}' must be a number, a (min, max) pair, or None.")

        rp = norm(-2, 1) if log10_rho_prior is None else as_prior(log10_rho_prior, 'rho_prior')
        user_sp = None if log10_sigma_prior is None else as_prior(log10_sigma_prior, 'sigma_prior')
        rb = as_bounds(log10_rho_bounds, [-5, -2], 'log10_rho_bounds')

        times = self.white_times
        errors = self.white_errors
        residuals = [o-m for o,m in zip(self.white_fluxes, self.white_models)]
        self.white_gp_models = []

        gp_hyperparameters = []
        for i, (time, fres, ferr) in enumerate(zip(times, residuals, errors)):
            log10_sigma_guess = log10(fres.std())

            # The default sigma bounds and prior depend on the scatter of this light curve.
            sb = as_bounds(log10_sigma_bounds, [log10_sigma_guess - 1, log10_sigma_guess + 1], 'log10_sigma_bounds')
            sp = norm(log10_sigma_guess, 0.1) if user_sp is None else user_sp
            bounds = array([sb, rb])

            gp = GaussianProcess(terms.Matern32Term(sigma=fres.std(), rho=0.1))

            def nll(log10x):
                """Negative log posterior of the GP hyperparameters, infinite outside the bounds."""
                x = 10**log10x
                if any(log10x < bounds[:,0]) or any(log10x > bounds[:,1]):
                    return inf
                gp.kernel = terms.Matern32Term(sigma=x[0], rho=x[1])
                gp.compute(time, yerr=ferr, quiet=True)
                return -(gp.log_likelihood(fres) + sp.logpdf(log10x[0]) + rp.logpdf(log10x[1]))

            de = DiffEvol(nll, bounds, npop, min_ptp=0.2)
            # A scalar bound specification doubles as the starting value for the whole population.
            if is_scalar(log10_sigma_bounds):
                de.population[:, 0] = log10_sigma_bounds
            if is_scalar(log10_rho_bounds):
                de.population[:, 1] = log10_rho_bounds

            de.optimize(niter)
            x = de.minimum_location
            sigma, rho = 10**x[0], 10**x[1]
            gp_hyperparameters.append(10**x)

            # The GP must be recomputed after the kernel is changed: otherwise the prediction
            # would use the factorization left behind by the last trial vector of the optimizer.
            gp.kernel = terms.Matern32Term(sigma=sigma, rho=rho)
            gp.compute(time, yerr=ferr, quiet=True)
            self.white_gp_models.append(gp.predict(fres))
            self._tsa.set_gp_hyperparameters(sigma, rho, i)
        return gp_hyperparameters