Source code for jwspecmcmc.result

"""MCMC result containers.

:class:`MCMCResult` holds the full posterior chains and derived
quantities.  :meth:`MCMCResult.to_fit_result` converts the median
posterior to a :class:`jwspecfit.fitter.FitResult` for compatibility
with :func:`jwspecfit.plotting.plot_fit`.

:class:`MCMCBroadFitResult` wraps an :class:`MCMCResult` with BIC
model-selection metadata for broad Balmer component fitting.
"""

from __future__ import annotations

import logging
from dataclasses import dataclass, field
from math import sqrt, pi
from typing import Any

import numpy as np

from jwspecfit.constraints import ConstraintSet
from jwspecfit.fitter import FitResult, LineResult
from jwspecfit.io import Spectrum, _ujy_to_flam, _flam_to_ujy
from jwspecfit.lines import REST_LINES_A
from jwspecfit.models import build_model

logger = logging.getLogger(__name__)

_SQRT2PI = sqrt(2.0 * pi)



[docs]
@dataclass
class MCMCLineResult:
    """MCMC posterior summary for a single emission line.

    Parameters
    ----------
    name : str
        Line name.
    rest_wave_A : float
        Rest-frame wavelength (Angstrom).
    amplitude : float
        Median posterior amplitude.
    amplitude_err : tuple of float
        (lower, upper) 68% credible interval half-widths on amplitude.
    centroid_A : float
        Median posterior centroid (Angstrom).
    centroid_err : tuple of float
        (lower, upper) 68% CI half-widths on centroid.
    sigma_A : float
        Median posterior sigma (Angstrom).
    sigma_err : tuple of float
        (lower, upper) 68% CI half-widths on sigma.
    flux : float
        Median integrated flux (= amplitude for area-normalised Gaussians).
    flux_err : tuple of float
        (lower, upper) 68% CI half-widths on flux.
    flux_posterior : np.ndarray
        Full flux posterior samples.
    ew_A : float
        Median rest-frame equivalent width (Angstrom).
    snr : float
        Signal-to-noise ratio (flux / mean of flux_err tuple).
    """

    name: str
    rest_wave_A: float
    amplitude: float
    amplitude_err: tuple[float, float]
    centroid_A: float
    centroid_err: tuple[float, float]
    sigma_A: float
    sigma_err: tuple[float, float]
    flux: float
    flux_err: tuple[float, float]
    flux_posterior: np.ndarray
    ew_A: float
    snr: float




[docs]
@dataclass
class MCMCResult:
    """Container for a complete MCMC fitting result.

    Parameters
    ----------
    lines : dict of MCMCLineResult
        Per-line posterior summaries, keyed by line name.
    flat_chains : np.ndarray
        Flattened posterior samples in the **full** parameter space,
        shape ``(n_samples, 3 * n_lines)``.
    flat_chains_free : np.ndarray
        Flattened posterior samples in the **free** parameter space,
        shape ``(n_samples, n_free)``.
    flat_log_prob : np.ndarray
        Log-posterior for each sample.
    chains : np.ndarray or None
        Raw chains of shape ``(n_walkers, n_steps, n_free)`` (emcee)
        or ``None`` (nautilus).
    params : np.ndarray
        Median posterior in the full parameter space.
    model_flux : np.ndarray
        Median model flux (µJy, continuum-subtracted).
    continuum : np.ndarray
        Continuum estimate (µJy).
    spectrum : Spectrum
        Input spectrum.
    line_names : list of str
        Ordered line names.
    constraints : ConstraintSet
        Applied constraints.
    convergence : dict
        Convergence diagnostics (R-hat, ESS).
    sampler_name : str
        Name of the sampler used (``"emcee"`` or ``"nautilus"``).
    sampler_meta : dict
        Additional sampler metadata (n_walkers, n_steps, etc.).
    """

    lines: dict[str, MCMCLineResult]
    flat_chains: np.ndarray
    flat_chains_free: np.ndarray
    flat_log_prob: np.ndarray
    chains: np.ndarray | None
    params: np.ndarray
    model_flux: np.ndarray
    continuum: np.ndarray
    spectrum: Spectrum
    line_names: list[str] = field(default_factory=list)
    constraints: ConstraintSet | None = None
    convergence: dict[str, Any] = field(default_factory=dict)
    sampler_name: str = ""
    sampler_meta: dict[str, Any] = field(default_factory=dict)
    lya_params: np.ndarray | None = None  # [A_peak, mu, sigma, alpha]


[docs]
    def to_fit_result(self) -> FitResult:
        """Convert to a :class:`jwspecfit.fitter.FitResult`.

        Uses the median posterior as the best fit and the mean of the
        asymmetric 68% CI as the symmetric flux error.

        Returns
        -------
        FitResult
        """
        # Convert median model to residuals.
        spec = self.spectrum
        resid_ujy = spec.flux_ujy - self.continuum - self.model_flux

        # Reduced chi-squared from median model.
        flam = _ujy_to_flam(spec.flux_ujy - self.continuum, spec.wave_um)
        flam_err = _ujy_to_flam(spec.err_ujy, spec.wave_um)
        model_flam = _ujy_to_flam(self.model_flux, spec.wave_um)
        valid = np.isfinite(flam) & np.isfinite(flam_err) & (flam_err > 0)
        r = np.zeros_like(flam)
        r[valid] = (flam[valid] - model_flam[valid]) / flam_err[valid]
        n_data = np.sum(valid)
        n_free = self.flat_chains_free.shape[1] if self.flat_chains_free.ndim == 2 else 0
        dof = max(n_data - n_free, 1)
        chi2_red = float(np.nansum(r**2)) / dof

        line_results = {}
        for name, mlr in self.lines.items():
            # Symmetric flux error = mean of asymmetric CI half-widths.
            flux_err_sym = 0.5 * (mlr.flux_err[0] + mlr.flux_err[1])
            line_results[name] = LineResult(
                name=mlr.name,
                rest_wave_A=mlr.rest_wave_A,
                amplitude=mlr.amplitude,
                centroid_A=mlr.centroid_A,
                sigma_A=mlr.sigma_A,
                flux=mlr.flux,
                flux_err=flux_err_sym,
                ew_A=mlr.ew_A,
                snr_int_err=mlr.snr,
                snr_int_cont=0.0,
                snr_peak_err=0.0,
                snr_peak_cont=0.0,
            )

        return FitResult(
            lines=line_results,
            params=self.params,
            model_flux=self.model_flux,
            continuum=self.continuum,
            residuals=resid_ujy,
            chi2=chi2_red,
            spectrum=spec,
            line_names=self.line_names,
            constraints=self.constraints,
            success=True,
            lya_params=self.lya_params,
        )



[docs]
    def doublet_flux_posterior(
        self,
        line_a: str,
        line_b: str,
    ) -> np.ndarray:
        """Compute the combined flux posterior for a doublet.

        Sums the flux posteriors sample-by-sample, giving the correct
        combined distribution even when individual members are degenerate
        (e.g. blended CIII] 1907+1909).

        Parameters
        ----------
        line_a : str
            First doublet member.
        line_b : str
            Second doublet member.

        Returns
        -------
        np.ndarray
            Posterior samples of ``flux(line_a) + flux(line_b)``.
        """
        if line_a not in self.lines:
            raise KeyError(f"Line '{line_a}' not found in result.")
        if line_b not in self.lines:
            raise KeyError(f"Line '{line_b}' not found in result.")
        return self.lines[line_a].flux_posterior + self.lines[line_b].flux_posterior



[docs]
    def doublet_snr(
        self,
        line_a: str,
        line_b: str,
    ) -> float:
        """Compute the SNR of a combined doublet flux.

        Uses the summed flux posterior to get a single SNR that is not
        degraded by the amplitude degeneracy between blended members.

        Parameters
        ----------
        line_a : str
            First doublet member.
        line_b : str
            Second doublet member.

        Returns
        -------
        float
            SNR of the combined doublet.
        """
        combined = self.doublet_flux_posterior(line_a, line_b)
        med = float(np.median(combined))
        lo = med - float(np.percentile(combined, 16))
        hi = float(np.percentile(combined, 84)) - med
        mean_err = 0.5 * (lo + hi)
        return med / mean_err if mean_err > 0 else 0.0



[docs]
    def flux_upper_limit(
        self,
        line_name: str,
        n_sigma: float = 3.0,
    ) -> float | None:
        """Compute a noise-based flux upper limit for a line.

        Uses the local RMS of the continuum-and-model-subtracted
        residuals near the line, multiplied by the line width and
        *n_sigma*.  This is the standard approach for non-detections
        and is independent of the posterior (which may be prior-
        dominated for weak lines).

        Parameters
        ----------
        line_name : str
            Line name.
        n_sigma : float
            Number of sigma for the upper limit (default 3).

        Returns
        -------
        float or None
            Integrated flux upper limit in f_lam units, or ``None``
            if there are insufficient pixels near the line.
        """
        if line_name not in self.lines:
            raise KeyError(f"Line '{line_name}' not found in result.")

        lr = self.lines[line_name]
        spec = self.spectrum

        # Residuals in f_lam: data - continuum - model.
        from jwspecfit.io import _ujy_to_flam
        data_flam = _ujy_to_flam(spec.flux_ujy, spec.wave_um)
        cont_flam = _ujy_to_flam(self.continuum, spec.wave_um)
        model_flam = _ujy_to_flam(self.model_flux, spec.wave_um)
        resid = data_flam - cont_flam - model_flam
        valid = np.isfinite(resid)

        wave_A = spec.wave_A
        lam_obs = lr.centroid_A
        sig_line = lr.sigma_A

        # Window: ±5σ around line, excluding central ±2σ.
        near = np.abs(wave_A - lam_obs)
        window = valid & (near < 5.0 * sig_line) & (near > 2.0 * sig_line)
        if int(np.sum(window)) < 3:
            window = valid & (near < 10.0 * sig_line)
        if int(np.sum(window)) < 3:
            return None

        rms = float(np.sqrt(np.nanmean(resid[window] ** 2)))
        return n_sigma * rms * sig_line * _SQRT2PI



[docs]
    def flux_upper_limits(
        self,
        line_names: list[str] | None = None,
        n_sigma: float = 3.0,
        snr_threshold: float = 3.0,
    ) -> dict[str, float]:
        """Compute noise-based upper limits for low-SNR lines.

        Parameters
        ----------
        line_names : list of str, optional
            Lines to check.  If ``None``, checks all fitted lines.
        n_sigma : float
            Number of sigma for the upper limit (default 3).
        snr_threshold : float
            Only compute upper limits for lines with SNR below this
            (default 3.0).  Lines above this threshold are detections.

        Returns
        -------
        dict of {str: float}
            ``{line_name: flux_upper_limit}`` for each line below
            the SNR threshold.
        """
        names = line_names if line_names is not None else list(self.lines.keys())
        uls: dict[str, float] = {}
        for name in names:
            if name not in self.lines:
                continue
            if self.lines[name].snr >= snr_threshold:
                continue
            ul = self.flux_upper_limit(name, n_sigma=n_sigma)
            if ul is not None:
                uls[name] = ul
        return uls



[docs]
    def flux_ratio_posterior(
        self,
        line_a: str,
        line_b: str,
    ) -> np.ndarray:
        """Compute the posterior distribution of a flux ratio.

        Parameters
        ----------
        line_a : str
            Numerator line name.
        line_b : str
            Denominator line name.

        Returns
        -------
        np.ndarray
            Posterior samples of ``flux(line_a) / flux(line_b)``.

        Raises
        ------
        KeyError
            If either line is not in the result.
        """
        if line_a not in self.lines:
            raise KeyError(f"Line '{line_a}' not found in result.")
        if line_b not in self.lines:
            raise KeyError(f"Line '{line_b}' not found in result.")

        flux_a = self.lines[line_a].flux_posterior
        flux_b = self.lines[line_b].flux_posterior

        # Avoid division by zero: mask samples where denominator is non-positive.
        with np.errstate(divide="ignore", invalid="ignore"):
            ratio = np.where(flux_b > 0, flux_a / flux_b, np.nan)
        return ratio





[docs]
@dataclass
class MCMCBroadFitResult:
    """MCMC result with BIC-based broad Balmer component selection.

    Wraps an :class:`MCMCResult` (full MCMC posteriors on the winning
    model) together with BIC model-selection metadata.

    Parameters
    ----------
    mcmc_result : MCMCResult
        Full MCMC posteriors for the selected model.
    selected_model : str
        Model name: ``"narrow"``, ``"broad1"``, ``"broad2"``, or ``"both"``.
    bic_narrow : float
        BIC for narrow-only model.
    bic_broad1 : float
        BIC for narrow + intermediate broad model (NaN if not attempted).
    bic_broad2 : float
        BIC for narrow + very broad model (NaN if not attempted).
    bic_both : float
        BIC for narrow + both broad components (NaN if not attempted).
    """

    mcmc_result: MCMCResult
    selected_model: str
    bic_narrow: float
    bic_broad1: float
    bic_broad2: float
    bic_both: float
    # Independent [OIII] outflow component selection.  Mirrors the
    # Balmer fields: oiii_selected is one of "off" / "broad1" /
    # "broad2" / "both"; the matching OIII broad lines (e.g.
    # ``OIII_5007_BROAD``, ``OIII_4959_BROAD2``) appear in the MCMC
    # posteriors when selected.
    oiii_selected: str = "off"
    bic_oiii_off: float = float("nan")
    bic_oiii_broad1: float = float("nan")
    bic_oiii_broad2: float = float("nan")
    bic_oiii_both: float = float("nan")
    # He I broad component selection — same shape as OIII.  Within each
    # tier, all observable HeI broads share kinematics (anchored on the
    # first present in HEI_BROAD_CANDIDATES).
    hei_selected: str = "off"
    bic_hei_off: float = float("nan")
    bic_hei_broad1: float = float("nan")
    bic_hei_broad2: float = float("nan")
    bic_hei_both: float = float("nan")

    @property
    def oiii_broad_selected(self) -> bool:
        """Convenience: True if any OIII broad component was selected."""
        return self.oiii_selected != "off"

    @property
    def hei_broad_selected(self) -> bool:
        """Convenience: True if any HeI broad component was selected."""
        return self.hei_selected != "off"

    # Delegate all MCMCResult attributes for full API compatibility.

    @property
    def lines(self) -> dict[str, MCMCLineResult]:
        """Per-line posterior summaries."""
        return self.mcmc_result.lines

    @property
    def flat_chains(self) -> np.ndarray:
        """Flattened posterior samples (full parameter space)."""
        return self.mcmc_result.flat_chains

    @property
    def flat_chains_free(self) -> np.ndarray:
        """Flattened posterior samples (free parameter space)."""
        return self.mcmc_result.flat_chains_free

    @property
    def flat_log_prob(self) -> np.ndarray:
        """Log-posterior for each sample."""
        return self.mcmc_result.flat_log_prob

    @property
    def chains(self) -> np.ndarray | None:
        """Raw walker chains (emcee) or None (nautilus)."""
        return self.mcmc_result.chains

    @property
    def params(self) -> np.ndarray:
        """Median posterior in the full parameter space."""
        return self.mcmc_result.params

    @property
    def model_flux(self) -> np.ndarray:
        """Median model flux (continuum-subtracted)."""
        return self.mcmc_result.model_flux

    @property
    def continuum(self) -> np.ndarray:
        """Continuum estimate."""
        return self.mcmc_result.continuum

    @property
    def spectrum(self) -> Spectrum:
        """Input spectrum."""
        return self.mcmc_result.spectrum

    @property
    def line_names(self) -> list[str]:
        """Ordered line names."""
        return self.mcmc_result.line_names

    @property
    def constraints(self) -> ConstraintSet | None:
        """Applied constraints."""
        return self.mcmc_result.constraints

    @property
    def convergence(self) -> dict[str, Any]:
        """Convergence diagnostics."""
        return self.mcmc_result.convergence

    @property
    def sampler_name(self) -> str:
        """Name of the sampler used."""
        return self.mcmc_result.sampler_name

    @property
    def sampler_meta(self) -> dict[str, Any]:
        """Additional sampler metadata."""
        return self.mcmc_result.sampler_meta


[docs]
    def to_fit_result(self) -> FitResult:
        """Convert to a :class:`jwspecfit.fitter.FitResult`.

        Delegates to :meth:`MCMCResult.to_fit_result`.

        Returns
        -------
        FitResult
        """
        return self.mcmc_result.to_fit_result()



[docs]
    def doublet_flux_posterior(self, line_a: str, line_b: str) -> np.ndarray:
        """Combined flux posterior for a doublet.

        Delegates to :meth:`MCMCResult.doublet_flux_posterior`.
        """
        return self.mcmc_result.doublet_flux_posterior(line_a, line_b)



[docs]
    def doublet_snr(self, line_a: str, line_b: str) -> float:
        """SNR of a combined doublet flux.

        Delegates to :meth:`MCMCResult.doublet_snr`.
        """
        return self.mcmc_result.doublet_snr(line_a, line_b)



[docs]
    def flux_upper_limit(self, line_name: str, n_sigma: float = 3.0) -> float | None:
        """Noise-based flux upper limit for a line.

        Delegates to :meth:`MCMCResult.flux_upper_limit`.
        """
        return self.mcmc_result.flux_upper_limit(line_name, n_sigma=n_sigma)



[docs]
    def flux_upper_limits(
        self, line_names: list[str] | None = None,
        n_sigma: float = 3.0, snr_threshold: float = 3.0,
    ) -> dict[str, float]:
        """Noise-based upper limits for low-SNR lines.

        Delegates to :meth:`MCMCResult.flux_upper_limits`.
        """
        return self.mcmc_result.flux_upper_limits(
            line_names=line_names, n_sigma=n_sigma, snr_threshold=snr_threshold,
        )



[docs]
    def flux_ratio_posterior(self, line_a: str, line_b: str) -> np.ndarray:
        """Compute the posterior distribution of a flux ratio.

        Delegates to :meth:`MCMCResult.flux_ratio_posterior`.

        Parameters
        ----------
        line_a : str
            Numerator line name.
        line_b : str
            Denominator line name.

        Returns
        -------
        np.ndarray
            Posterior samples of ``flux(line_a) / flux(line_b)``.
        """
        return self.mcmc_result.flux_ratio_posterior(line_a, line_b)