# Source code for unite.model

"""Model builder and numpyro model function for spectral line fitting.

The :class:`ModelBuilder` assembles a :class:`~unite.line.config.LineConfiguration`,
an optional :class:`~unite.continuum.config.ContinuumConfiguration`, and a
:class:`~unite.spectrum.spectrum.Spectra` collection into a numpyro model
function that can be passed to any numpyro inference algorithm (NUTS, SVI, etc.).
"""

from __future__ import annotations

import math
import warnings
from collections.abc import Callable
from dataclasses import dataclass, field
from typing import Any, cast

import jax
import jax.numpy as jnp
import numpyro
from astropy import units as u
from numpyro import distributions as dist

from unite._compose import compose_from_profiles
from unite._lsf import _FWHM_TO_SIGMA
from unite._utils import _get_conversion_factor
from unite.continuum.compute import eval_continuum, integrate_continuum
from unite.continuum.config import ContinuumConfiguration
from unite.line.compute import (
    _build_line_params,
    _peak_to_area_tau,
    evaluate_lines,
    integrate_lines,
)
from unite.line.config import ConfigMatrices, LineConfiguration
from unite.prior import Fixed, Parameter, Prior, topological_sort
from unite.spectrum import Spectra, Spectrum

# Gaussian kernel half-width, in units of the LSF sigma, for the banded LSF
# convolution.  +/-4 sigma captures >99.99% of the Gaussian area, so increasing
# this has diminishing returns.  ModelBuilder.build() multiplies the largest
# LSF sigma by this factor when it auto-computes ``conv_half_width`` for
# ``integration_mode='convolution'``.
_LSF_TRUNCATION_SIGMA: float = 4.0

# ------------------------------------------------------------------
# ModelArgs — data bundle for the numpyro model function
# ------------------------------------------------------------------



# [docs]
@dataclass
class ModelArgs:
    """Argument bundle consumed by :func:`unite_model`.

    Instances are produced by :meth:`ModelBuilder.build`; users are not
    expected to construct one by hand.
    """

    # ---- Line configuration and data ----
    #: Line metadata together with the precomputed parameter matrices.
    matrices: ConfigMatrices
    #: The individual spectra entering the likelihood.
    spectra: list[Spectrum]
    #: Systemic redshift.
    redshift: float

    # ---- Continuum configuration ----
    #: Continuum configuration; ``None`` when no continuum is modelled.
    cont_config: ContinuumConfiguration | None
    #: Per-region ``{param_name: ContinuumParam}`` mappings, taken from
    #: :attr:`ContinuumConfiguration.resolved_params`.
    cont_resolved_params: list[dict[str, Parameter]] | None

    # ---- Parameters and sampling order ----
    #: Prior for every parameter (line, calibration, continuum), keyed by name.
    all_priors: dict[str, Prior]
    #: Parameter names in topological (dependency-respecting) sampling order.
    dependency_order: list[str]
    #: Site name -> token object; :func:`unite_model` uses it to key the
    #: token-identity context that is handed to the priors.
    name_to_token: dict[str, object]

    # ---- Wavelength unit conversion ----
    #: One multiplicative factor per spectrum: spectrum unit -> canonical unit.
    spec_to_canonical: list[float]

    # ---- Continuum bounds, pre-converted (rest frame, canonical unit) ----
    cont_low: list[float] | None
    cont_high: list[float] | None
    cont_center: list[float] | None
    #: Per-region conversion factor: ``region.unit`` -> canonical unit.
    cont_nw_conv: list[float] | None
    #: Continuum forms, pre-converted (static wavelength config in canonical unit).
    cont_forms: list | None

    # ---- Flux normalization and scales ----
    #: One flux normalization factor per spectrum.
    norm_factors: list[float]
    #: Line flux scale per spectrum (that spectrum's flux_unit * canonical_wl_unit).
    line_flux_scales: list[float]
    #: Continuum scale per spectrum (that spectrum's flux_unit).
    continuum_scales: list[float]
    #: Wavelength unit of the canonical frame (first spectrum's disperser unit).
    canonical_unit: object
    #: Flux density unit of each spectrum.
    flux_units: list
    #: ``line_scale`` / ``continuum_scale`` Quantities from Spectra (kept for
    #: results output).
    line_scale_quantity: u.Quantity | None
    continuum_scale_quantity: u.Quantity | None

    # ---- Labels ----
    #: Human-readable label per line, parallel to ``matrices.wavelengths``;
    #: derived from user-supplied line names and rest-frame wavelengths.
    line_labels: list[str]
    #: Human-readable label per continuum region, parallel to ``cont_config``;
    #: derived from form type and wavelength bounds.
    continuum_labels: list[str]

    #: Boolean mask of shape ``(n_lines,)`` selecting the tau lines that
    #: attenuate the continuum: ``cont_applies[k]`` is True when
    #: ``line_zorders[k] > cont_zorder`` and ``is_tau[k]``.
    cont_applies: jnp.ndarray

    # ---- Integration settings ----
    #: Line integration mode.  ``'analytic'`` (default) integrates every line
    #: profile individually with exact CDF-based integration; ``'convolution'``
    #: evaluates the intrinsic model on a fine sub-pixel grid and numerically
    #: convolves it with the wavelength-dependent Gaussian LSF.
    integration_mode: str = 'analytic'
    #: Uniform sub-pixel evaluation points per pixel in convolution mode;
    #: ``None`` when ``integration_mode != 'convolution'``.
    n_super: int | None = None
    #: Half-width of the banded LSF convolution kernel, in fine-grid indices.
    #: Computed at build time as a plain Python ``int`` (never a traced value);
    #: ``None`` when ``integration_mode != 'convolution'``.
    conv_half_width: int | None = None

    # ---- Private caches (excluded from comparison and repr) ----
    #: Per-spectrum JIT'd vmapped evaluators, filled lazily by
    #: :func:`~unite.compute.evaluate_model` so repeated calls with the same
    #: :class:`ModelArgs` avoid Python-level retracing.
    _evaluators: list[Any] | None = field(default=None, compare=False, repr=False)
    #: Profile codes remapped to 0-based indices into the specialized branch
    #: lists; ``None`` when specialization is inactive (all profiles used or
    #: no lines).
    _profile_codes_local: Any | None = field(default=None, compare=False, repr=False)
    #: Specialized vmapped integrate function (only used-profile branches compiled).
    _integrate_fn: Any | None = field(default=None, compare=False, repr=False)
    #: Specialized vmapped evaluate function.
    _evaluate_fn: Any | None = field(default=None, compare=False, repr=False)
    #: Specialized vmapped evaluate-at-own-centers function (used by
    #: ``_peak_to_area_tau``).
    _evaluate_at_centers_fn: Any | None = field(default=None, compare=False, repr=False)

    def __len__(self) -> int:
        """Return how many spectra the model contains."""
        n_spectra = len(self.spectra)
        return n_spectra

    def __bool__(self) -> bool:
        """Return True when the model holds one or more spectra."""
        return len(self.spectra) != 0



# ------------------------------------------------------------------
# Specialized profile dispatch
# ------------------------------------------------------------------


def _make_specialized_dispatch(profile_codes: jnp.ndarray) -> tuple[Any, Any, Any, Any]:
    """Create vmapped dispatchers restricted to the profiles a config uses.

    The result is the 4-tuple
    ``(profile_codes_local, integrate_fn, evaluate_fn, evaluate_at_centers_fn)``.

    If ``profile_codes`` is empty, or it already references every registered
    profile, the input codes and the module-level generic functions are
    returned untouched.  Otherwise the codes are remapped to 0-based indices
    into a pruned branch list and the returned functions run ``lax.switch``
    over just those branches, which shrinks the XLA graph (and compile time)
    roughly in proportion to the share of profiles left out.
    """
    from unite.line.compute import (
        evaluate_lines,
        evaluate_lines_at_own_centers,
        integrate_lines,
    )
    from unite.line.library import _EVALUATE_BRANCHES, _INTEGRATE_BRANCHES

    # Unspecialized answer, shared by both "nothing to prune" exits below.
    generic = (
        profile_codes,
        integrate_lines,
        evaluate_lines,
        evaluate_lines_at_own_centers,
    )

    # No lines at all: nothing to specialize.
    if len(profile_codes) == 0:
        return generic

    # Every registered profile is in use: pruning would gain nothing.
    distinct = sorted({int(code) for code in profile_codes})
    if len(distinct) == len(_INTEGRATE_BRANCHES):
        return generic

    # Global profile code -> position inside the pruned branch lists.
    remap = dict(zip(distinct, range(len(distinct))))
    local_codes = jnp.array([remap[int(code)] for code in profile_codes])

    pruned_integrate = []
    pruned_evaluate = []
    for code in distinct:
        pruned_integrate.append(_INTEGRATE_BRANCHES[code])
        pruned_evaluate.append(_EVALUATE_BRANCHES[code])

    def _switch_over(branches):
        """Return a single-line kernel that dispatches on ``code`` over *branches*."""

        def _single(grid, center, lsf_fwhm, p0, p1, p2, code):
            return jax.lax.switch(
                code, branches, grid, center, lsf_fwhm, p0, p1, p2
            )

        return _single

    integrate_one = _switch_over(pruned_integrate)
    evaluate_one = _switch_over(pruned_evaluate)

    # in_axes order: (grid, center, lsf_fwhm, p0, p1, p2, code).
    # Integrate: grid and LSF are shared across lines; the rest map per line.
    spec_integrate = jax.vmap(integrate_one, in_axes=(None, 0, None, 0, 0, 0, 0))
    # Evaluate: only the wavelength grid is shared across lines.
    spec_evaluate = jax.vmap(evaluate_one, in_axes=(None, 0, 0, 0, 0, 0, 0))
    # Evaluate-at-centers: every argument, including the wavelength, is per line.
    spec_eval_centers = jax.vmap(evaluate_one, in_axes=(0, 0, 0, 0, 0, 0, 0))

    return local_codes, spec_integrate, spec_evaluate, spec_eval_centers


# ------------------------------------------------------------------
# Numpyro model function
# ------------------------------------------------------------------



# [docs]
def unite_model(args: ModelArgs) -> None:
    """Numpyro model function for multi-spectrum emission-line fitting.

    The function runs in three stages:

    1. Every parameter in ``args.dependency_order`` is visited in order.
       :class:`Fixed` priors contribute their resolved value directly; every
       other prior becomes a ``numpyro.sample`` site named after the parameter.
    2. Per-line flux, tau, center and shape arrays are assembled by
       :func:`_build_line_params`; when tau parameters exist, peak tau is
       converted to area tau.
    3. For each spectrum a pixel-averaged model is computed (analytically or
       by numerical LSF convolution, per ``args.integration_mode``) and
       compared with the data through a Normal likelihood site named
       ``obs_<spectrum.name>`` (or ``obs_<index>`` when the name is falsy).

    All lines are integrated simultaneously via :func:`jax.vmap` with
    ``lax.switch`` dispatching to the correct profile kernel per line.
    Parameter broadcasting from unique tokens to per-line arrays is done
    with precomputed indicator matrices.

    Wavelength unit conversion is handled via pre-computed scalar factors
    stored in ``args.spec_to_canonical`` (one per spectrum).  Flux is
    normalized per spectrum so that the likelihood operates on O(1) values.

    Parameters
    ----------
    args : ModelArgs
        Pre-built data bundle from :meth:`ModelBuilder.build`.

    Returns
    -------
    None
        All results are recorded as numpyro sample sites.
    """
    cm = args.matrices
    z_sys = args.redshift
    n_lines = cm.wavelengths.shape[0]
    # True when at least one tau (absorption) parameter name is registered.
    has_tau = bool(cm.tau_names)

    # Resolve per-config dispatch functions (fall back to module-level if not set).
    _pcodes = (
        args._profile_codes_local
        if args._profile_codes_local is not None
        else cm.profile_codes
    )
    _int_fn = args._integrate_fn if args._integrate_fn is not None else integrate_lines
    _eval_fn = args._evaluate_fn if args._evaluate_fn is not None else evaluate_lines

    # --- 1. Sample all parameters in dependency order ---
    # Two parallel dicts are maintained:
    #   context    — str → value, used for all downstream name-based lookups.
    #   obj_ctx    — token_object → value, passed to prior.to_dist() so that
    #                parameter expressions can look up dependency values by
    #                token identity.
    context: dict[str, jnp.ndarray] = {}
    obj_ctx: dict[object, jnp.ndarray] = {}
    for pname in args.dependency_order:
        prior = args.all_priors[pname]
        if isinstance(prior, Fixed):
            # Fixed priors create no sample site; their value is used as-is.
            val: jnp.ndarray = jnp.asarray(prior.resolved_value(obj_ctx))
        else:
            distribution = prior.to_dist(obj_ctx)
            assert distribution is not None
            val = cast(jnp.ndarray, numpyro.sample(pname, distribution))
        context[pname] = val
        # Names without a registered token are only reachable through `context`.
        tok = args.name_to_token.get(pname)
        if tok is not None:
            obj_ctx[tok] = val

    # --- 2. Per-line parameter arrays via matrix products ---
    flux_per_line, tau_per_line, centers, p0, p1, p2 = _build_line_params(
        cm, context, n_lines, z_sys
    )

    # --- 2b. Convert peak-tau to area-tau ---
    # NOTE(review): `_evaluate_at_centers_fn` may be None here; presumably
    # `_peak_to_area_tau` falls back to its own default in that case — confirm.
    if cm.tau_names:
        tau_per_line = _peak_to_area_tau(
            tau_per_line,
            centers,
            p0,
            p1,
            p2,
            _pcodes,
            cm.is_tau,
            _eval_fn=args._evaluate_at_centers_fn,
        )

    # --- 3. Per-spectrum likelihood ---
    for i, spectrum in enumerate(args.spectra):
        disp = spectrum.disperser
        # wl_scale: spectrum wavelength unit → canonical unit (and its inverse).
        wl_scale = args.spec_to_canonical[i]
        inv_wl_scale = 1.0 / wl_scale
        norm = args.norm_factors[i]
        lfs = args.line_flux_scales[i]
        cs = args.continuum_scales[i]

        # Calibration values (every disperser always carries these tokens).
        r_scale = context[disp.r_scale.name]
        flux_scale = context[disp.flux_scale.name]
        pix_offset = context[disp.pix_offset.name]

        # Edge topology (canonical wavelength unit) — shared by all lines.
        edges = spectrum.edges * wl_scale  # (E,)
        keep_mask = spectrum.keep_mask  # (E-1,)
        # Shift the edges by pix_offset times the local dispersion, evaluated
        # at the unshifted edges in the spectrum's own unit and then converted
        # to the canonical unit.
        edges = edges - (pix_offset * disp.dlam_dpix(spectrum.edges) * wl_scale)
        widths = jnp.diff(edges)  # (E-1,)

        # Scaled line fluxes and continuum for this spectrum.
        scaled_flux = flux_per_line * lfs / norm
        cont_scale_norm = cs / norm

        # --- Compute pixel-averaged model ---
        if args.integration_mode == 'convolution':
            # Numerical LSF convolution: evaluate the intrinsic model (lsf_fwhm=0)
            # on a uniform fine sub-pixel grid, convolve with the wavelength-
            # dependent Gaussian LSF, then pixel-average.  This correctly computes
            # LSF ⊗ [F · exp(-τ · φ_intrinsic)] rather than F · exp(-τ · LSF ⊗ φ).
            from unite._lsf import _lsf_convolve

            n_super = args.n_super
            half_width = args.conv_half_width
            # Both are populated by ModelBuilder.build() in convolution mode.
            assert n_super is not None
            assert half_width is not None

            # Per-pixel low/high — needed only by convolution.
            low = edges[:-1][keep_mask]
            high = edges[1:][keep_mask]
            n_pixels = low.shape[0]

            # Fine grid: n_super uniform points per pixel, midpoints of sub-bins.
            # Transposed to wavelength order: all sub-bins of pixel 0, then pixel 1, etc.
            # Shape: (n_pixels * n_super,).
            offsets = (jnp.arange(n_super) + 0.5) / n_super  # (n_super,)
            x_fine = (
                low[None, :] + offsets[:, None] * (high - low)[None, :]
            )  # (n_super, n_pixels)
            x_flat = x_fine.T.ravel()  # (n_pixels * n_super,) in wavelength order

            # Evaluate intrinsic model (lsf_fwhm=0) on fine grid.
            # _combine_fwhm(0, fwhm) = fwhm, so intrinsic profiles are used.
            zero_lsf = jnp.zeros_like(centers)

            # Loop-dependent values are bound as keyword defaults so the
            # closure captures this iteration's values rather than late-binding
            # to whatever the loop variables hold afterwards.
            def _conv_eval(
                wav,
                *,
                _zero_lsf=zero_lsf,
                _scaled_flux=scaled_flux,
                _csn=cont_scale_norm,
                _efn=_eval_fn,
                _pc=_pcodes,
            ):
                phi = _efn(wav, centers, _zero_lsf, p0, p1, p2, _pc)
                cont = eval_continuum(wav, args, context, z_sys, 0.0) * _csn
                return compose_from_profiles(
                    phi,
                    _scaled_flux,
                    tau_per_line,
                    cm.is_tau,
                    cm.applies_matrix,
                    args.cont_applies,
                    cont,
                    has_tau=has_tau,
                )

            model_fine_intrinsic = _conv_eval(x_flat)  # (n_pixels * n_super,)

            # LSF sigma at each fine-grid point: FWHM = λ / (R · r_scale), with
            # R evaluated in the spectrum's own wavelength unit.
            sigma_fine = (
                x_flat / (disp.R(x_flat * inv_wl_scale) * r_scale) * _FWHM_TO_SIGMA
            )

            # Convolve on the fine grid, then pixel-average.
            model_fine_conv = _lsf_convolve(
                x_flat, model_fine_intrinsic, sigma_fine, half_width
            )
            model_pix = model_fine_conv.reshape(n_pixels, n_super).mean(axis=1)
            model = flux_scale * model_pix
        else:
            # Analytic: each profile's cumulative-at-edges array, then diff
            # → per-interval integral → mask off inter-pixel-gap entries →
            # divide by widths → pixel-averaged profile.
            # Per-edge LSF (length E, shared across all lines of this spectrum).
            lsf_at_edges = edges / (disp.R(edges * inv_wl_scale) * r_scale)

            cum_per_line = _int_fn(
                edges, centers, lsf_at_edges, p0, p1, p2, _pcodes
            )  # (n_lines, E)
            per_interval = jnp.diff(cum_per_line, axis=1) / widths  # (n_lines, E-1)
            pixints = per_interval[:, keep_mask]  # (n_lines, npix)

            # Per-region LSF FWHM (scalar per region) for polynomial-based
            # continuum forms' analytic Gaussian-moment convolution.
            if args.cont_config is not None and args.cont_center is not None:
                # Region centers are stored in the rest frame; move them to
                # the observed frame before evaluating the resolution.
                cont_centers_obs = jnp.array(args.cont_center) * (1.0 + z_sys)
                cont_lsf_per_region = cont_centers_obs / (
                    disp.R(cont_centers_obs * inv_wl_scale) * r_scale
                )
            else:
                cont_lsf_per_region = jnp.zeros(0)
            cont_per_interval = integrate_continuum(
                edges, args, context, z_sys, cont_lsf_per_region
            )  # (E-1,)
            cont = cont_per_interval[keep_mask] * cont_scale_norm  # (npix,)

            model = flux_scale * compose_from_profiles(
                pixints,
                scaled_flux,
                tau_per_line,
                cm.is_tau,
                cm.applies_matrix,
                args.cont_applies,
                cont,
                has_tau=has_tau,
            )
        # Observation site: named after the spectrum, or its index when unnamed.
        # Data, error and model all live in the same normalized flux units.
        obs_name = f'obs_{spectrum.name}' if spectrum.name else f'obs_{i}'
        numpyro.sample(
            obs_name,
            dist.Normal(model, spectrum.scaled_error / norm),
            obs=spectrum.flux / norm,
        )



# ------------------------------------------------------------------
# ModelBuilder
# ------------------------------------------------------------------



# [docs]
class ModelBuilder:
    """Assemble configuration objects into a numpyro model.

    Collects all unique parameter tokens (line, calibration, continuum),
    builds precomputed indicator matrices, performs a topological sort for
    dependency resolution, and packages everything into a
    ``(model_fn, model_args)`` pair.

    Parameters
    ----------
    line_config : LineConfiguration or None
        Emission/absorption line configuration.  Handling depends on whether
        ``spectra`` has already been prepared (see Notes):

        - If ``spectra`` is **not** prepared, ``line_config`` is required and is
          passed to :py:meth:`~unite.spectrum.Spectra.prepare` for coverage
          filtering.  ``None`` raises ``ValueError``.
        - If ``spectra`` is already prepared, a non-``None`` ``line_config`` is
          used **verbatim** (no re-filtering); ``None`` falls back to the stored
          :py:attr:`~unite.spectrum.Spectra.prepared_line_config`.
    continuum_config : ContinuumConfiguration or None
        Continuum configuration, handled independently of ``line_config``:

        - If ``spectra`` is **not** prepared, it is passed to
          :py:meth:`~unite.spectrum.Spectra.prepare`; ``None`` means a
          lines-only model.
        - If ``spectra`` is already prepared, a non-``None`` value is used
          **verbatim**; ``None`` falls back to the stored
          :py:attr:`~unite.spectrum.Spectra.prepared_cont_config` (which may
          itself be ``None`` for a lines-only model).
    spectra : Spectra
        Spectrum collection with systemic redshift.

    Notes
    -----
    Coverage filtering (dropping lines/regions outside the spectral coverage,
    and optionally empty continuum regions) happens **only** during the first
    :py:meth:`~unite.spectrum.Spectra.prepare`.  Once ``spectra`` is prepared,
    configs passed to ``ModelBuilder`` are taken at face value and are **not**
    re-filtered — the caller is responsible for their coverage correctness.
    To re-filter (e.g. with different ``drop_empty_regions``), call
    ``spectra.prepare(...)`` again before constructing the builder.

    Examples
    --------
    >>> model_fn, args = ModelBuilder(line_config, cont, spectra).build()
    >>> kernel = numpyro.infer.NUTS(model_fn)
    >>> mcmc = numpyro.infer.MCMC(kernel, num_warmup=500, num_samples=1000)
    >>> mcmc.run(jax.random.PRNGKey(0), args)
    """

    def __init__(
        self,
        line_config: LineConfiguration | None,
        continuum_config: ContinuumConfiguration | None,
        spectra: Spectra,
    ) -> None:
        """Resolve the configurations and register every parameter token.

        Raises
        ------
        ValueError
            If ``spectra`` has not been prepared and ``line_config`` is ``None``.
        """
        self._spectra = spectra

        if spectra.is_prepared:
            # Spectra already prepared: anything passed explicitly is used
            # verbatim (no re-filtering; coverage correctness is the caller's
            # job).  Each omitted config falls back, independently of the
            # other, to the one stored at preparation time.
            if line_config is None:
                line_config = spectra.prepared_line_config
                assert line_config is not None, (
                    'prepared_line_config is None despite is_prepared=True'
                )
            if continuum_config is None:
                continuum_config = spectra.prepared_cont_config
        elif line_config is None:
            # First preparation needs a line_config to coverage-filter against.
            raise ValueError(
                'No line_config supplied and spectra has not been prepared. '
                'Either pass line_config to ModelBuilder or call '
                'spectra.prepare(line_config, continuum_config) first.'
            )
        else:
            # First preparation; continuum_config (possibly None for a
            # lines-only model) is forwarded to prepare() alongside.
            line_config, continuum_config = spectra.prepare(
                line_config, continuum_config
            )

        # Compute scales automatically when the caller has not done so.
        if spectra.line_scale is None:
            warnings.warn(
                'Line scale not set; calling spectra.compute_scales() with '
                'defaults. Call spectra.compute_scales(line_config, '
                'continuum_config) explicitly for full control.',
                UserWarning,
                stacklevel=2,
            )
            spectra.compute_scales(line_config, continuum_config)

        self._cont_config = continuum_config

        # The canonical wavelength unit is the one chosen by Spectra.
        self._canonical_unit = spectra.canonical_unit

        # Precomputed matrices derived from the line entries.
        self._matrices = line_config.build_matrices()

        # Line wavelengths may each carry a different Quantity unit, so each
        # one is converted to the canonical unit individually.
        if len(line_config) > 0:
            self._matrices.wavelengths = jnp.array(
                [
                    float(entry.wavelength.to(self._canonical_unit).value)
                    for entry in line_config._entries
                ]
            )

        # --- Gather every unique parameter token for priors / topo-sort ---
        all_priors: dict[str, Prior] = dict(self._matrices.priors)

        # token -> name for line tokens; each token carries its own ``.name``.
        param_to_name: dict[object, str] = {}
        for entry in line_config._entries:
            line_tokens = (
                entry.flux,
                entry.tau,
                entry.redshift,
                *entry.fwhms.values(),
            )
            for tok in line_tokens:
                if tok is not None:
                    param_to_name[tok] = tok.name

        def _register(tok, seen_ids: set[int]) -> None:
            """Record *tok*'s prior and name unless its identity is in *seen_ids*."""
            if id(tok) in seen_ids:
                return
            name = tok.name
            seen_ids.add(id(tok))
            all_priors[name] = tok.prior
            param_to_name[tok] = name

        # Calibration tokens, visiting each distinct disperser object once.
        visited_dispersers: set[int] = set()
        known_tok_ids: set[int] = {id(tok) for tok in param_to_name}
        for spectrum in spectra:
            disp = spectrum.disperser
            if id(disp) in visited_dispersers:
                continue
            visited_dispersers.add(id(disp))
            for tok in (disp.r_scale, disp.flux_scale, disp.pix_offset):
                _register(tok, known_tok_ids)

        # Continuum tokens are de-duplicated by identity, so a token shared by
        # several regions yields a single numpyro site.
        if continuum_config is not None:
            cont_tok_ids: set[int] = set()
            for resolved in continuum_config.resolved_params:
                for tok in resolved.values():
                    _register(tok, cont_tok_ids)

        self._all_priors = all_priors
        if all_priors:
            self._dep_order = topological_sort(all_priors, param_to_name)
        else:
            self._dep_order = []

        self._line_config = line_config

        # Reverse mapping, site name -> token object, used by unite_model to
        # build its token-keyed context.  It covers every token registered
        # above: line, calibration and continuum.
        self._name_to_token: dict[str, object] = {}
        for tok, name in param_to_name.items():
            self._name_to_token[name] = tok

    @property
    def matrices(self) -> ConfigMatrices:
        """Precomputed matrices for the line configuration the builder resolved.

        Built in ``__init__`` via ``line_config.build_matrices()``.  When the
        builder itself prepared the spectra, the configuration (and hence these
        matrices) is the coverage-filtered one returned by ``spectra.prepare``.
        For a non-empty configuration, ``wavelengths`` holds the line
        wavelengths converted to the canonical wavelength unit.
        """
        return self._matrices


# [docs]
    def build(
        self,
        *,
        integration_mode: str = 'analytic',
        n_super: int = 10,
        conv_half_width: int | None = None,
    ) -> tuple[Callable, ModelArgs]:
        """Build the numpyro model function and its arguments.

        Parameters
        ----------
        integration_mode : str, optional
            How line profiles are integrated over pixels.  One of:

            * ``'analytic'`` (default) — exact CDF-based integration
              for emission profiles and pixel-center evaluation for
              absorption profiles.
            * ``'convolution'`` — evaluates the intrinsic model
              (``lsf_fwhm=0``) on a uniform fine sub-pixel grid of
              ``n_super`` points per pixel, numerically convolves with
              the wavelength-dependent Gaussian LSF, then pixel-averages.
              Correctly computes ``LSF ⊗ [F · exp(-τ · φ_intrinsic)]``
              rather than ``F · exp(-τ · LSF ⊗ φ)``, eliminating the
              LSF pre-convolution approximation for absorption lines.

        n_super : int, optional
            Number of uniform sub-pixel evaluation points per pixel
            (default: 10).  Only used when
            ``integration_mode='convolution'``.  Higher values resolve
            narrower intrinsic line profiles at the cost of speed.
            ``n_super=10`` is adequate for NIRSpec gratings; increase to
            20 for narrow absorbers at PRISM resolution.
        conv_half_width : int or None, optional
            Half-width of the banded LSF convolution kernel in fine-grid
            indices (default: ``None``).  When ``None``, auto-computed at
            build time as ``ceil(4 * max_sigma * n_super / min_dlam_pix)``
            where ``max_sigma`` is the largest LSF sigma across all spectra
            and ``min_dlam_pix`` is the smallest pixel width.
            Only used when ``integration_mode='convolution'``.

        Returns
        -------
        model_fn : callable
            The numpyro model function (signature: ``model_fn(args)``).
        model_args : ModelArgs
            Pre-built data bundle to pass to the model function.

        Raises
        ------
        ValueError
            If *integration_mode* is not one of the valid values.
        """
        valid_modes = ('analytic', 'convolution')
        if integration_mode not in valid_modes:
            msg = (
                f'integration_mode must be one of {valid_modes}, '
                f'got {integration_mode!r}.'
            )
            raise ValueError(msg)

        # Trim spectra to union of continuum regions (observed frame).
        # Pixels outside all regions have model = 0 and would corrupt the
        # likelihood if observed flux is nonzero.  Trimming also reduces
        # array sizes passed to JAX.
        z = self._spectra.redshift
        if self._cont_config is not None:
            trimmed_spectra: list[Spectrum] = []
            for s in self._spectra:
                mask = jnp.zeros(s.npix, dtype=bool)
                for region in self._cont_config:
                    conv = _get_conversion_factor(region.unit, s.unit)
                    obs_low = region.low * conv * (1.0 + z)
                    obs_high = region.high * conv * (1.0 + z)
                    mask = mask | s.pixel_mask(obs_low, obs_high)
                trimmed = s._sliced(mask)
                if trimmed.npix > 0:
                    trimmed_spectra.append(trimmed)
                else:
                    warnings.warn(
                        f'Spectrum {s.name!r} has no pixels overlapping '
                        f'any continuum region and will be excluded from '
                        f'the fit.',
                        UserWarning,
                        stacklevel=2,
                    )
            if not trimmed_spectra:
                warnings.warn(
                    'All spectra are fully masked after trimming to '
                    'continuum regions. The resulting model has no spectra '
                    'and should not be used for fitting. Check that your '
                    'continuum configuration covers the observed wavelength '
                    'range.',
                    UserWarning,
                    stacklevel=2,
                )
        else:
            trimmed_spectra = list(self._spectra)

        # For convolution mode, compute the kernel half-width (in fine-grid indices)
        # from the maximum LSF sigma and minimum fine-grid spacing across all spectra.
        if integration_mode == 'convolution':
            if conv_half_width is None:
                max_lsf_fwhm = 0.0
                min_dlam = float('inf')
                for s in trimmed_spectra:
                    wl_scale = _get_conversion_factor(s.unit, self._canonical_unit)
                    pix_mid_disp = (s.low + s.high) / 2.0
                    r_arr = jnp.asarray(s.disperser.R(pix_mid_disp))
                    lsf = jnp.asarray(pix_mid_disp * wl_scale) / r_arr
                    max_lsf_fwhm = max(max_lsf_fwhm, float(jnp.max(lsf)))
                    pix_widths = (s.high - s.low) * wl_scale
                    min_dlam = min(min_dlam, float(jnp.min(pix_widths)))
                max_sigma = max_lsf_fwhm * _FWHM_TO_SIGMA
                conv_half_width = max(
                    1, math.ceil(_LSF_TRUNCATION_SIGMA * max_sigma * n_super / min_dlam)
                )
            n_super_val: int | None = n_super
            conv_half_width_val: int | None = conv_half_width
        else:
            n_super_val = None
            conv_half_width_val = None

        # Per-spectrum wavelength conversion factors.
        spec_to_canonical = [
            _get_conversion_factor(s.unit, self._canonical_unit)
            for s in trimmed_spectra
        ]

        # Per-spectrum flux normalization.
        norm_factors = [_compute_norm_factor(s) for s in trimmed_spectra]

        # Line flux scale (Quantity from Spectra.compute_scales).
        line_scale_qty = self._spectra.line_scale
        # Continuum scale (Quantity from Spectra.compute_scales; fallback).
        cont_scale_qty = self._spectra.continuum_scale

        # Convert Quantity scales to per-spectrum float values.
        # line_flux_scale needs units of [flux_density * canonical_wl_unit]
        # for each spectrum.
        # continuum_scale needs units of [flux_density] for each spectrum.
        canonical_unit = self._canonical_unit
        line_flux_scales: list[float] = []
        continuum_scales: list[float] = []
        assert line_scale_qty is not None, (
            'line_scale must be set before building the model'
        )
        for s in trimmed_spectra:
            target_line_unit = s.flux_unit * canonical_unit
            lfs = float(line_scale_qty.to(target_line_unit).value)
            line_flux_scales.append(lfs)

            if cont_scale_qty is not None:
                cs = float(cont_scale_qty.to(s.flux_unit).value)
            else:
                cs = 1.0
            continuum_scales.append(cs)

        flux_units = [s.flux_unit for s in trimmed_spectra]

        # Pre-convert continuum region bounds to canonical unit.
        if self._cont_config is not None:
            cont_low = []
            cont_high = []
            cont_center = []
            cont_nw_conv = []
            cont_forms = []
            for region in self._cont_config:
                conv = _get_conversion_factor(region.unit, self._canonical_unit)
                cont_low.append(region.low * conv)
                cont_high.append(region.high * conv)
                cont_center.append(region.center * conv)
                cont_nw_conv.append(conv)
                cont_forms.append(region.form)
        else:
            cont_low = None
            cont_high = None
            cont_center = None
            cont_nw_conv = None
            cont_forms = None

        line_labels = _make_line_labels(self._line_config)
        continuum_labels = (
            _make_continuum_labels(self._cont_config)
            if self._cont_config is not None
            else []
        )

        # cont_applies[k] = True when tau line k (zorder_k > cont_zorder) attenuates the continuum.
        cm = self._matrices
        cont_zorder = self._cont_config.zorder if self._cont_config is not None else 0
        cont_applies = (cm.line_zorders > cont_zorder) & cm.is_tau

        local_codes, int_fn, eval_fn, eval_centers_fn = _make_specialized_dispatch(
            self._matrices.profile_codes
        )

        args = ModelArgs(
            matrices=self._matrices,
            spectra=trimmed_spectra,
            redshift=self._spectra.redshift,
            cont_config=self._cont_config,
            cont_resolved_params=(
                self._cont_config.resolved_params
                if self._cont_config is not None
                else None
            ),
            all_priors=self._all_priors,
            dependency_order=self._dep_order,
            name_to_token=self._name_to_token,
            spec_to_canonical=spec_to_canonical,
            cont_low=cont_low,
            cont_high=cont_high,
            cont_center=cont_center,
            cont_nw_conv=cont_nw_conv,
            cont_forms=cont_forms,
            norm_factors=norm_factors,
            line_flux_scales=line_flux_scales,
            continuum_scales=continuum_scales,
            canonical_unit=canonical_unit,
            flux_units=flux_units,
            line_scale_quantity=line_scale_qty,
            continuum_scale_quantity=cont_scale_qty,
            line_labels=line_labels,
            continuum_labels=continuum_labels,
            cont_applies=cont_applies,
            integration_mode=integration_mode,
            n_super=n_super_val,
            conv_half_width=conv_half_width_val,
            _profile_codes_local=local_codes,
            _integrate_fn=int_fn,
            _evaluate_fn=eval_fn,
            _evaluate_at_centers_fn=eval_centers_fn,
        )
        return unite_model, args



[docs]
    def fit(
        self,
        num_warmup: int = 250,
        num_samples: int = 1000,
        num_chains: int = 1,
        seed: int = 0,
        progress_bar: bool = True,
        integration_mode: str = 'analytic',
        n_super: int = 10,
    ) -> tuple[dict, ModelArgs]:
        """Fit the model using NUTS sampling (convenience wrapper).

        This method builds the model via :meth:`build`, runs MCMC with a
        dense-mass NUTS kernel, and returns the posterior samples. For more
        control over the sampler (e.g., custom kernel, SVI, nested
        sampling), call :meth:`build` directly and use numpyro's inference
        APIs.

        Parameters
        ----------
        num_warmup : int, optional
            Number of warmup iterations per chain (default: 250).
        num_samples : int, optional
            Number of posterior samples per chain (default: 1000).
        num_chains : int, optional
            Number of MCMC chains (default: 1).
        seed : int, optional
            Random seed for JAX's PRNG (default: 0).
        progress_bar : bool, optional
            Whether to display a progress bar (default: True).
        integration_mode : str, optional
            Line integration mode (default: ``'analytic'``).  Forwarded
            unchanged to :meth:`build`; see there for details.
        n_super : int, optional
            Sub-pixel evaluation points per pixel for convolution mode
            (default: 10).  Forwarded unchanged to :meth:`build`; see there
            for details.

        Returns
        -------
        tuple
            ``(samples, model_args)`` where ``samples`` is the dictionary
            returned by ``MCMC.get_samples()`` (chains flattened, so each
            parameter has leading dimension ``num_chains * num_samples``),
            and ``model_args`` is the :class:`ModelArgs` bundle produced by
            :meth:`build`.  Diagnostic keys added to ``samples``:

            * ``'log_prob'`` — always present.  Negative of the sampler's
              potential energy, i.e. the log joint probability
              (log-likelihood + log-prior) for each sample; proportional to
              the log-posterior up to a constant.  Use
              ``np.argmax(samples['log_prob'])`` to find the MAP sample.
            * ``'log_likelihood'`` — present whenever numpyro's
              ``log_likelihood`` utility returns at least one entry for the
              model.  For each sample, the log-likelihood terms of every
              returned entry are summed over all non-sample axes and then
              added together across entries.

        Examples
        --------
        >>> samples, model_args = builder.fit(num_warmup=200, num_samples=500, num_chains=4)
        """
        import jax
        import numpy as _np
        from numpyro import infer
        from numpyro.infer.util import log_likelihood as _npy_ll

        model_fn, model_args = self.build(
            integration_mode=integration_mode, n_super=n_super
        )
        mcmc = infer.MCMC(
            infer.NUTS(model_fn, dense_mass=True),
            num_warmup=num_warmup,
            num_samples=num_samples,
            num_chains=num_chains,
            progress_bar=progress_bar,
        )
        # Ask the sampler to record the potential energy so that the log
        # joint can be reported alongside the samples.
        mcmc.run(
            jax.random.PRNGKey(seed), model_args, extra_fields=('potential_energy',)
        )
        samples = mcmc.get_samples()
        # log_prob = log joint = log_likelihood + log_prior (up to a constant).
        extra = mcmc.get_extra_fields()
        samples['log_prob'] = -_np.asarray(extra['potential_energy'])
        # log_likelihood: collapse every returned array to one value per
        # sample, then add the per-entry totals together.
        ll_dict = _npy_ll(model_fn, samples, model_args)
        if ll_dict:
            # Convert each entry to numpy once instead of twice per entry.
            per_entry = (_np.asarray(v) for v in ll_dict.values())
            samples['log_likelihood'] = sum(
                arr.reshape(arr.shape[0], -1).sum(axis=-1) for arr in per_entry
            )
        return samples, model_args




# ------------------------------------------------------------------
# Label and normalization helpers
# ------------------------------------------------------------------


def _make_line_labels(line_config: LineConfiguration) -> list[str]:
    """Collect one label per line entry, in configuration order.

    The label of an entry is simply its ``name`` attribute, read from
    ``line_config._entries``.  Line names are expected to be unique within
    a :class:`~unite.line.config.LineConfiguration`, which is what lets
    the name double as a label; this helper does not check uniqueness
    itself.  For multiplets and multi-component lines, use ``add_lines``
    (which auto-generates names as ``'{name}_{center.value:g}'``) or pass
    explicit unique names to ``add_line``.
    """
    labels: list[str] = []
    for line_entry in line_config._entries:
        labels.append(line_entry.name)
    return labels


def _make_continuum_labels(cont_config: ContinuumConfiguration) -> list[str]:
    """Return one readable label per continuum region, in iteration order.

    Each label has the shape ``'{form_type}_{low:.4g}_{high:.4g}'``:

    * ``form_type`` is the lower-cased class name of the region's
      ``form`` object (e.g. ``'linear'``, ``'powerlaw'``,
      ``'polynomial'``).
    * ``low`` and ``high`` are the region's bounds exactly as stored on
      the region (no unit conversion is applied here), formatted with
      four significant digits.

    Examples: ``'linear_6400_6700'``, ``'powerlaw_0.95_2.5'``.
    """
    return [
        f'{type(region.form).__name__.lower()}_{region.low:.4g}_{region.high:.4g}'
        for region in cont_config
    ]


def _compute_norm_factor(s: Spectrum) -> float:
    """Robust scale factor to bring a spectrum's flux to ~O(1).

    The factor is chosen as follows:

    1. The median of the absolute flux values that are strictly positive
       (zeros and NaNs never satisfy ``> 0`` and are therefore ignored).
    2. If no such value exists, the maximum of ``s.error``, provided it is
       strictly positive.
    3. Otherwise (no pixels at all, or a non-positive / NaN maximum
       error), ``1.0``.

    Parameters
    ----------
    s : Spectrum
        Object exposing ``flux`` and ``error`` arrays.

    Returns
    -------
    float
        Positive normalization factor.
    """
    absflux = jnp.abs(s.flux)
    positive = absflux[absflux > 0]
    if positive.size:
        return float(jnp.median(positive))

    # No usable flux value: fall back to the error array.  ``jnp.max``
    # raises on a zero-size input, so an empty spectrum is short-circuited
    # to the neutral factor instead of crashing.
    error = jnp.asarray(s.error)
    if error.size == 0:
        return 1.0
    fallback = float(jnp.max(error))
    # A NaN maximum compares False here and also yields the neutral factor.
    return fallback if fallback > 0 else 1.0