# Source code for sft_wick.workflow.config

"""YAML-driven configuration for the workflow API.

Lets users declare an entire ``System`` / ``Expansion`` /
``Propagators`` / sweep pipeline in a single YAML file, with fields
mapping 1:1 to the Python L1 API so the config is self-documenting.

Invoke via the CLI::

    sft-wick run examples/demo1_config.yaml

Or programmatically::

    from sft_wick.workflow.config import load_workflow_config, run_workflow

    cfg = load_workflow_config("examples/demo1_config.yaml")
    sweep, totals_df = run_workflow(cfg)
"""

from __future__ import annotations

import importlib.util
import math
import os
import sys
from dataclasses import dataclass, field
from pathlib import Path
from typing import Any

import numpy as np


# =========================================================================
# Internal dataclasses — a thin typed mirror of the L1 ``System`` spec
# =========================================================================



[docs]
@dataclass(frozen=True)
class WorkflowConfig:
    """Top-level parsed config.

    Bundles the four required sections of a workflow YAML file
    (``system``, ``expand``, ``propagators``, ``sweep``) with the optional
    list of ``output`` entries.  The dataclass is frozen, so attributes
    cannot be rebound after construction.
    """

    # Parsed ``system`` section.
    system: "SystemConfig"
    # Parsed ``expand`` section.
    expand: "ExpandConfig"
    # Parsed ``propagators`` section.
    propagators: "PropagatorsConfig"
    # Parsed ``sweep`` section.
    sweep: "SweepConfig"
    # One entry per item of the optional ``output`` list; empty by default.
    output: list["OutputConfig"] = field(default_factory=list)




[docs]
@dataclass(frozen=True)
class SystemConfig:
    """Parsed ``system`` section of a workflow config.

    The nested specs are kept as plain dicts/lists; ``build_system``
    lowers them to spec objects.
    """

    # Name of the field (``system.field.name``).
    field_name: str
    # Number of field components (``system.field.n_components``).
    n_components: int
    # ``system.linear`` mapping; lowered to a linear-operator spec by
    # ``build_system``.
    linear: dict
    # ``system.noise`` mapping; lowered by ``_build_noise``.
    noise: dict
    # Local vertex specs (one dict per vertex, read via ``name`` / ``coupling``).
    vertices: list
    # Non-local vertex specs (one dict per vertex).
    nonlocal_vertices: list = field(default_factory=list)
    # Forwarded unchanged to ``System(t_min=...)``.
    t_min: float = 0.0
    # Resolved at parse time so that noise.kappa2.type='callable_module'
    # (and any future module-loaded specs in the system block) can resolve
    # paths relative to the YAML file at build time.
    base_dir: Path | None = None




[docs]
@dataclass(frozen=True)
class ExpandConfig:
    """Parsed ``expand`` section of a workflow config.

    ``run_workflow`` forwards every field except ``n_jobs`` as a keyword
    argument of the same name to ``system.expand``.
    """

    # Required; stored as a tuple of the YAML sequence.
    observable: tuple
    # Required; stored as a tuple of ints.
    orders: tuple
    response_phase: bool = True
    ito: bool = True
    collect_topology: bool = True
    iso_R: Any = None
    diag_R: bool = True
    # ``run_workflow`` passes ``False`` instead of this value when
    # ``propagators.diag_C`` is false.
    diag_C: bool = True
    iso_C: bool = False
    cache_path: Any = None
    # Forwarded to ``expansion.sweep`` as ``evaluate_n_jobs`` (not to
    # ``system.expand``).
    n_jobs: int = 1




[docs]
@dataclass(frozen=True)
class PropagatorsConfig:
    """Parsed ``propagators`` section of a workflow config.

    ``run_workflow`` forwards most fields as keyword arguments of the same
    name to ``system.propagators``; the exceptions are noted per field.
    """

    # Required upper end of the time grid.
    t_max: float
    # Number of time-grid points.  The parser derives it as
    # ``max(2, ceil(t_max / dt))`` when ``dt`` is given.
    n_grid_t: int = 60
    # Step the user supplied, if any.  Recorded here but not passed to
    # ``system.propagators`` (only the derived ``n_grid_t`` is).
    dt: float | None = None
    homogeneity: Any = None
    r_max: Any = None
    n_grid_r: Any = None
    n_grid_cos: Any = None
    x_max: Any = None
    n_grid_x: Any = None
    n_jobs: int = 1
    # Path to a ``.py`` file, already resolved against the YAML file's
    # directory by the parser; ``None`` means no closed-form C is loaded.
    c_closed_form_module: Any = None
    # Attribute looked up in that module.
    c_closed_form_attr: str = "C_fn"
    c_closed_form_only: bool = False
    c_closed_form_vectorized: bool = False
    cache_path: Any = None
    interp_method: str = "linear"
    c_method: str = "dblquad"  # 'dblquad' | 'gauss_legendre'
    c_n_gauss: int = 20  # nodes per dim under c_method='gauss_legendre'
    # Set False to preserve off-diagonal C entries (e.g. lensing
    # kappa-gamma_+ cross). Requires c_closed_form_only=True. When False,
    # the runner also uses expand.diag_C=False so the symbolic
    # simplification keeps the (a, b) observable indices distinct --
    # without that step the order-0 cross pair (a != b) collapses to 0
    # via the KroneckerDelta(a, b) inserted by DiagramTerm.apply_diagonal.
    diag_C: bool = True



[docs]
@dataclass(frozen=True)
class SweepConfig:
    """Parsed ``sweep`` section of a workflow config.

    ``run_workflow`` forwards every field as a keyword argument of the
    same name to ``expansion.sweep``.
    """

    # Required mapping; the parser stores each value as a list.
    positions_grid: dict
    # Required sequence, stored as a list.
    t_final_grid: list
    # Required sequence; each entry is stored as a tuple.
    component_pairs: list
    orders: Any = None
    vertex_types: Any = None
    integrate_over: Any = None
    method: str = "qmc_vectorized"
    n_samples: int = 2 ** 13
    seed: int = 42
    n_jobs: int = 1
    n_gauss: int = 8  # used only when method='gauss_legendre'




[docs]
@dataclass(frozen=True)
class OutputConfig:
    """One parsed entry of the ``output`` list of a workflow config."""

    type: str  # "table" | "npz" | "plot"
    # Destination file.  Required for "npz" and "plot"; a "table" with no
    # path is printed instead of written.
    path: Any = None
    # Type-specific:
    format: str = "markdown"   # for table: "markdown" | "csv" | "plain"
    x: Any = None              # for plot (required there)
    # ``y``, ``hue`` and ``facet_col`` are passed to ``sweep.plot`` together
    # with ``x``.
    y: str = "value"
    hue: Any = "order"
    facet_col: Any = None



# =========================================================================
# YAML → WorkflowConfig
# =========================================================================



[docs]
def load_workflow_config(
    path: str | Path,
    overrides: dict | None = None,
) -> WorkflowConfig:
    """Load and validate a workflow YAML config.

    Args:
        path: path to a YAML file.
        overrides: optional ``{dotted.key: value}`` dict to patch
            the loaded config (e.g. ``{"sweep.seed": 7}``).

    Returns:
        A :class:`WorkflowConfig` ready to pass to :func:`run_workflow`.

    Raises:
        ImportError: if PyYAML is not installed.
        ValueError: if the file does not contain a top-level mapping
            (for example an empty file or a bare list), or if a section
            fails validation.
        KeyError: if an override key does not exist in the loaded config.
    """
    try:
        import yaml
    except ImportError as e:
        raise ImportError(
            "YAML workflow configs require PyYAML.  "
            "Install with `pip install pyyaml`."
        ) from e

    path = Path(path)
    # Hand PyYAML the raw bytes so it performs its own UTF-8 / UTF-16
    # detection instead of depending on the platform's locale encoding.
    with path.open("rb") as f:
        data = yaml.safe_load(f)

    # An empty file parses to ``None`` and a bare sequence to a list; fail
    # here with a clear message rather than deep inside section parsing.
    if not isinstance(data, dict):
        raise ValueError(
            f"workflow config {str(path)!r} must contain a top-level "
            f"mapping; got {type(data).__name__}."
        )

    if overrides:
        for dotted_key, value in overrides.items():
            _apply_override(data, dotted_key, value)

    return _parse_workflow(data, base_dir=path.parent)



def _apply_override(data: dict, dotted_key: str, value: Any) -> None:
    """Apply a ``"a.b.c": value`` override to a nested dict."""
    parts = dotted_key.split(".")
    cur = data
    for p in parts[:-1]:
        if not isinstance(cur, dict) or p not in cur:
            raise KeyError(
                f"override key '{dotted_key}' does not exist in config"
            )
        cur = cur[p]
    leaf = parts[-1]
    if not isinstance(cur, dict) or leaf not in cur:
        raise KeyError(
            f"override key '{dotted_key}' does not exist in config"
        )
    cur[leaf] = value


def _parse_workflow(data: dict, base_dir: Path) -> WorkflowConfig:
    """Validate the top-level sections and parse each into its dataclass.

    ``base_dir`` is the directory relative paths in the config are resolved
    against.
    """
    required = {
        name: _require_dict(data, name)
        for name in ("system", "expand", "propagators", "sweep")
    }
    raw_outputs = data.get("output", [])

    # propagators.dt is read up front and handed to the system parser so
    # the linear gamma-spline cache can derive its grid size from the same
    # step by default.
    raw_dt = required["propagators"].get("dt")
    shared_dt = None if raw_dt is None else float(raw_dt)

    return WorkflowConfig(
        system=_parse_system(
            required["system"], base_dir, default_dt=shared_dt
        ),
        expand=_parse_expand(required["expand"]),
        propagators=_parse_propagators(required["propagators"], base_dir),
        sweep=_parse_sweep(required["sweep"]),
        output=[_parse_output(entry) for entry in (raw_outputs or [])],
    )


def _require_dict(d: dict, key: str) -> dict:
    if key not in d:
        raise ValueError(f"config missing required top-level section '{key}'")
    if not isinstance(d[key], dict):
        raise ValueError(f"config section '{key}' must be a mapping")
    return d[key]


def _parse_system(
    d: dict, base_dir: Path, *, default_dt: float | None = None
) -> SystemConfig:
    fld = d.get("field", {}) or {}
    name = fld.get("name", "phi")
    nc = int(fld.get("n_components", 1))

    linear = d.get("linear")
    if linear is None:
        raise ValueError("system.linear is required")
    linear = _resolve_linear(dict(linear), base_dir, default_dt=default_dt)

    noise = d.get("noise")
    if noise is None:
        raise ValueError("system.noise is required")

    vertices = d.get("vertices", []) or []
    nonlocal_vertices = d.get("nonlocal_vertices", []) or []

    # Resolve coupling tensor file paths relative to the YAML file.
    vertices = [_resolve_coupling(v, base_dir) for v in vertices]
    nonlocal_vertices = [
        _resolve_coupling(v, base_dir) for v in nonlocal_vertices
    ]

    return SystemConfig(
        field_name=name, n_components=nc,
        linear=linear, noise=noise,
        vertices=vertices, nonlocal_vertices=nonlocal_vertices,
        t_min=float(d.get("t_min", 0.0)),
        base_dir=base_dir,
    )


def _resolve_coupling(v: dict, base_dir: Path) -> dict:
    """Resolve the vertex spec's ``coupling`` to either an inline
    numpy array or a callable loaded from a user module.

    Priority order:
      ``coupling``          — inline tensor (nested YAML lists).
      ``coupling_path``     — path to an ``.npy`` file, loaded as a
                              numpy array.
      ``coupling_module``   — path to a ``.py`` module exporting an
                              attribute (default ``coupling_fn``)
                              used as a callable ``fn(n_list,
                              t_list) -> tensor``.  Required for
                              spacetime-dependent non-local vertices
                              like demo2's ``κ^{(3)}``.
    """
    out = dict(v)
    if "coupling_path" in out and "coupling" not in out:
        p = (base_dir / out.pop("coupling_path")).resolve()
        out["coupling"] = np.load(p)
    elif "coupling_module" in out and "coupling" not in out:
        mod_path = (base_dir / out.pop("coupling_module")).resolve()
        attr = out.pop("coupling_attr", "coupling_fn")
        out["coupling"] = _load_callable_from_module(mod_path, attr)
    return out


def _resolve_linear(
    lin: dict, base_dir: Path, *, default_dt: float | None = None
) -> dict:
    """Resolve ``system.linear`` based on its ``type`` field.

    Supported lowerings:

    ``type: diagonal`` (default) -> :class:`sft_wick.workflow.specs.DiagonalA`

        ``gamma``: inline list of floats, or a 1D nested-list array.
        ``gamma_module``: path to a ``.py`` module exporting an attribute
            (default ``gamma``) used as a callable ``gamma(t) -> array(N)``.
            Required for spacetime-dependent linear drift such as the
            Sachs-saddle ``2 theta^(sa)(lambda)``.

        Discretization: the spline cache uses ``n_grid_cache`` points
        uniformly on ``[0, t_max_cache]``. When the user provides ``dt``
        (here or via ``propagators.dt``), it is converted to
        ``n_grid_cache = ceil(t_max_cache / dt)`` so a single ``dt``
        controls every grid in the workflow. Providing both ``dt`` and
        ``n_grid_cache`` is rejected to avoid ambiguity.

    ``type: explicit`` -> :class:`sft_wick.workflow.specs.ExplicitR`

        Escape hatch for scalar closed-form R: the user supplies
        ``R(t1, t2)`` directly, so the wrapper bypasses the
        gamma-spline cache entirely. This unlocks YAML use cases the
        diagonal lowering can't express -- e.g. causal kernels with
        non-exponential decay, or pre-computed spline callables loaded
        from disk.

        ``R_time_module``: path to a ``.py`` module exporting an
            attribute (default ``R_time``) used as a callable
            ``R_time(t1, t2) -> float``. Must enforce causality
            (return 0 when ``t1 < t2``).
        ``iso_R``: must be ``True`` (default). Matrix-valued R remains
            an L0/L1 escape hatch; the L2 YAML numerical wrappers are
            scalar-R only.

        γ-spline cache knobs (``gamma``, ``gamma_module``, ``dt``,
        ``n_grid_cache``, ``t_max_cache``) do not apply under this
        type and raise if specified -- the propagator is the user's
        callable, not a derived spline.
    """
    lt = lin.get("type", "diagonal")
    if lt == "explicit":
        return _resolve_linear_explicit(lin, base_dir)
    if lt == "diagonal":
        return _resolve_linear_diagonal(lin, base_dir, default_dt=default_dt)
    raise ValueError(
        f"Unsupported linear operator type {lt!r}.  "
        f"Supported: 'diagonal', 'explicit'."
    )


def _resolve_linear_diagonal(
    lin: dict, base_dir: Path, *, default_dt: float | None = None
) -> dict:
    """Parse-time resolver for ``type: diagonal``."""
    if "gamma" in lin and "gamma_module" in lin:
        raise ValueError(
            "system.linear: provide exactly one of {'gamma', 'gamma_module'}"
        )
    if "gamma_module" in lin and "gamma" not in lin:
        mod_path = (base_dir / lin.pop("gamma_module")).resolve()
        attr = lin.pop("gamma_attr", "gamma")
        lin["gamma"] = _load_callable_from_module(mod_path, attr)

    # dt -> n_grid_cache derivation. linear.dt overrides propagators.dt.
    linear_dt = lin.pop("dt", None)
    effective_dt = float(linear_dt) if linear_dt is not None else default_dt
    if effective_dt is not None:
        if effective_dt <= 0.0:
            raise ValueError(
                f"system.linear.dt (or propagators.dt) must be positive, "
                f"got {effective_dt}"
            )
        if "n_grid_cache" in lin:
            raise ValueError(
                "system.linear: specify exactly one of {'dt' (here or in "
                "propagators), 'n_grid_cache'}; got both."
            )
        t_max_cache = float(lin.get("t_max_cache", 100.0))
        lin["n_grid_cache"] = max(2, int(math.ceil(t_max_cache / effective_dt)))
    return lin


def _resolve_linear_explicit(lin: dict, base_dir: Path) -> dict:
    """Parse-time resolver for ``type: explicit``.

    Loads ``R_time`` from a user module and rejects fields that only
    make sense under the diagonal-with-gamma-spline path. The module
    is registered for cross-process by-value serialisation by
    :func:`_load_callable_from_module`, so the loaded callable composes
    with ``propagators.n_jobs > 1`` / ``sweep.n_jobs > 1`` even when
    joblib reuses a worker pool across calls.
    """
    forbidden = (
        "gamma", "gamma_module", "gamma_attr",
        "dt", "n_grid_cache", "t_max_cache",
    )
    present = [k for k in forbidden if k in lin]
    if present:
        raise ValueError(
            f"system.linear.type='explicit' does not accept "
            f"gamma-spline fields {present!r}.  Use 'type: diagonal' for "
            f"those, or remove them under 'type: explicit'."
        )
    if "R_time" in lin:
        raise ValueError(
            "system.linear.type='explicit' does not support an inline "
            "'R_time' (a callable cannot be expressed in YAML).  Use "
            "'R_time_module' + 'R_time_attr' instead."
        )
    if "R_time_module" not in lin:
        raise ValueError(
            "system.linear.type='explicit' requires "
            "'R_time_module: <relative path to .py file>'."
        )
    iso_r = lin.get("iso_R", True)
    if isinstance(iso_r, str):
        iso_r = iso_r.strip().lower() not in {"0", "false", "no", "off"}
    else:
        iso_r = bool(iso_r)
    if not iso_r:
        raise ValueError(
            "system.linear.type='explicit' currently supports only scalar "
            "R_time callables; set iso_R: true. Matrix-valued R is "
            "available from the L0/L1 Python APIs, but not from L2 YAML."
        )
    lin["iso_R"] = True
    mod_path = (base_dir / lin.pop("R_time_module")).resolve()
    attr = lin.pop("R_time_attr", "R_time")
    lin["R_time"] = _load_callable_from_module(mod_path, attr)
    return lin


def _load_callable_from_module(path: Path, attr: str):
    """Import ``path`` as a standalone module and return
    ``getattr(module, attr)``.

    Registers the module under its file basename (``path.stem``) and ensures
    ``path.parent`` is on both ``sys.path`` (for the current process) and
    the ``PYTHONPATH`` environment variable (for subprocess workers, e.g.
    joblib loky). Without the env-var step, a worker process started after
    this call cannot re-import the module by name, and unpickling a cache
    that holds the loaded callable raises ``BrokenProcessPool`` /
    ``ModuleNotFoundError``.
    """
    parent_dir = str(path.parent.resolve())
    if parent_dir not in sys.path:
        sys.path.append(parent_dir)

    # Propagate parent_dir to subprocess workers via PYTHONPATH. loky
    # workers inherit os.environ but not the parent's sys.path mods,
    # so this is the durable channel.
    pp = os.environ.get("PYTHONPATH", "")
    pp_parts = pp.split(os.pathsep) if pp else []
    if parent_dir not in pp_parts:
        os.environ["PYTHONPATH"] = os.pathsep.join([parent_dir, *pp_parts])

    module_name = path.stem
    spec_obj = importlib.util.spec_from_file_location(module_name, path)
    if spec_obj is None or spec_obj.loader is None:
        raise ImportError(
            f"Cannot load coupling module {path!r}."
        )
    module = importlib.util.module_from_spec(spec_obj)
    sys.modules[module_name] = module
    spec_obj.loader.exec_module(module)
    fn = getattr(module, attr, None)
    if fn is None or not callable(fn):
        raise AttributeError(
            f"Module {path!r} has no callable attribute {attr!r}."
        )
    _register_module_by_value(module)
    return fn


def _register_module_by_value(module) -> None:
    """Register ``module`` for cross-process by-value serialisation.

    Modules loaded via :func:`importlib.util.spec_from_file_location`
    are not importable by name in subprocess workers. joblib's loky
    backend uses a persistent worker pool whose ``sys.path`` /
    ``PYTHONPATH`` is fixed at first-pool-creation time, so a worker
    spawned during an earlier test won't have a later test's
    ``tmp_path`` available.

    cloudpickle's ``register_pickle_by_value`` flips the encoding so
    the module's source is shipped inline with each task. Workers no
    longer need to import anything by name.

    Falls back silently if cloudpickle is unavailable (joblib pulls
    it in, but a custom install might not).
    """
    try:
        from joblib.externals import cloudpickle
    except ImportError:  # pragma: no cover - joblib pulls in cloudpickle
        return
    try:
        cloudpickle.register_pickle_by_value(module)
    except (TypeError, ValueError):  # pragma: no cover - defensive
        # cloudpickle rejects modules that are part of a package or
        # don't have a real source file. Either case means the worker
        # can already import the module by name, so by-value encoding
        # is not needed.
        pass


def _parse_expand(d: dict) -> ExpandConfig:
    obs = d.get("observable")
    if obs is None:
        raise ValueError("expand.observable is required")
    orders = d.get("orders")
    if orders is None:
        raise ValueError("expand.orders is required")
    return ExpandConfig(
        observable=tuple(obs),
        orders=tuple(int(o) for o in orders),
        response_phase=bool(d.get("response_phase", True)),
        ito=bool(d.get("ito", True)),
        collect_topology=bool(d.get("collect_topology", True)),
        iso_R=d.get("iso_R"),
        diag_R=bool(d.get("diag_R", True)),
        diag_C=bool(d.get("diag_C", True)),
        iso_C=bool(d.get("iso_C", False)),
        cache_path=d.get("cache_path"),
        n_jobs=int(d.get("n_jobs", 1)),
    )


def _parse_propagators(d: dict, base_dir: Path) -> PropagatorsConfig:
    if "t_max" not in d:
        raise ValueError("propagators.t_max is required")
    module_spec = d.get("c_closed_form_module")
    if module_spec is not None:
        module_spec = str((base_dir / module_spec).resolve())

    t_max = float(d["t_max"])
    dt = d.get("dt")
    has_n_grid_t = "n_grid_t" in d
    if dt is not None:
        dt = float(dt)
        if dt <= 0.0:
            raise ValueError(f"propagators.dt must be positive, got {dt}")
        if has_n_grid_t:
            raise ValueError(
                "propagators: specify exactly one of {'dt', 'n_grid_t'}; "
                "got both."
            )
        n_grid_t = max(2, int(math.ceil(t_max / dt)))
    else:
        n_grid_t = int(d.get("n_grid_t", 60))

    return PropagatorsConfig(
        t_max=t_max,
        n_grid_t=n_grid_t,
        dt=dt,
        homogeneity=d.get("homogeneity"),
        r_max=d.get("r_max"),
        n_grid_r=d.get("n_grid_r"),
        n_grid_cos=d.get("n_grid_cos"),
        x_max=d.get("x_max"),
        n_grid_x=d.get("n_grid_x"),
        n_jobs=int(d.get("n_jobs", 1)),
        c_closed_form_module=module_spec,
        c_closed_form_attr=str(d.get("c_closed_form_attr", "C_fn")),
        c_closed_form_only=bool(d.get("c_closed_form_only", False)),
        c_closed_form_vectorized=bool(d.get("c_closed_form_vectorized", False)),
        cache_path=d.get("cache_path"),
        interp_method=str(d.get("interp_method", "linear")),
        c_method=str(d.get("c_method", "dblquad")),
        c_n_gauss=int(d.get("c_n_gauss", 20)),
        diag_C=bool(d.get("diag_C", True)),
    )


def _parse_sweep(d: dict) -> SweepConfig:
    if "positions_grid" not in d:
        raise ValueError("sweep.positions_grid is required")
    if "t_final_grid" not in d:
        raise ValueError("sweep.t_final_grid is required")
    if "component_pairs" not in d:
        raise ValueError("sweep.component_pairs is required")
    cps = [tuple(pair) for pair in d["component_pairs"]]
    return SweepConfig(
        positions_grid={k: list(v) for k, v in d["positions_grid"].items()},
        t_final_grid=list(d["t_final_grid"]),
        component_pairs=cps,
        orders=d.get("orders"),
        vertex_types=d.get("vertex_types"),
        integrate_over=d.get("integrate_over"),
        method=str(d.get("method", "qmc_vectorized")),
        n_samples=int(d.get("n_samples", 2 ** 13)),
        seed=int(d.get("seed", 42)),
        n_jobs=int(d.get("n_jobs", 1)),
        n_gauss=int(d.get("n_gauss", 8)),
    )


def _parse_output(d: dict) -> OutputConfig:
    if "type" not in d:
        raise ValueError("each output entry must specify a 'type'")
    t = d["type"]
    if t not in ("table", "npz", "plot"):
        raise ValueError(
            f"output type must be one of 'table', 'npz', 'plot'; "
            f"got {t!r}."
        )
    return OutputConfig(
        type=t,
        path=d.get("path"),
        format=str(d.get("format", "markdown")),
        x=d.get("x"),
        y=str(d.get("y", "value")),
        hue=d.get("hue", "order"),
        facet_col=d.get("facet_col"),
    )


# =========================================================================
# WorkflowConfig → L1 System
# =========================================================================



[docs]
def build_system(cfg: SystemConfig):
    """Lower a parsed :class:`SystemConfig` to a
    :class:`sft_wick.System` instance.

    Raises:
        ValueError: if the linear operator type is unsupported, or an
            explicit linear operator is configured with a false ``iso_R``.
    """
    from . import specs as sp
    from .system import System

    # --- linear operator -------------------------------------------------
    linear_spec = dict(cfg.linear)
    kind = linear_spec.pop("type", "diagonal")
    if kind == "explicit":
        # The user supplies R(t1, t2) directly, so no gamma-spline cache
        # settings are involved.
        raw_flag = linear_spec.get("iso_R", True)
        scalar_r = (
            raw_flag.strip().lower() not in {"0", "false", "no", "off"}
            if isinstance(raw_flag, str)
            else bool(raw_flag)
        )
        if not scalar_r:
            raise ValueError(
                "system.linear.type='explicit' currently supports only scalar "
                "R_time callables; set iso_R: true."
            )
        linear = sp.ExplicitR(R_time=linear_spec["R_time"], iso_R=True)
    elif kind == "diagonal":
        gamma = linear_spec["gamma"]
        # A callable gamma is handed over untouched; anything else is
        # copied into a plain list.
        diagonal_kwargs = {"gamma": gamma if callable(gamma) else list(gamma)}
        diagonal_kwargs.update(
            (option, linear_spec[option])
            for option in ("t_max_cache", "n_grid_cache")
            if option in linear_spec
        )
        linear = sp.DiagonalA(**diagonal_kwargs)
    else:
        raise ValueError(
            f"Unsupported linear operator type {kind!r}.  "
            f"Supported: 'diagonal', 'explicit'."
        )

    # --- noise -----------------------------------------------------------
    noise = _build_noise(cfg.noise, base_dir=cfg.base_dir)

    # --- vertices --------------------------------------------------------
    def _as_coupling(spec: dict):
        # Callables pass through; everything else becomes an ndarray.
        raw = spec["coupling"]
        if callable(raw):
            return raw
        return np.asarray(raw)

    local_vertices = []
    for spec in cfg.vertices:
        local_vertices.append(
            sp.LocalVertex(name=spec["name"], coupling=_as_coupling(spec))
        )

    nonlocal_vertices = []
    for spec in cfg.nonlocal_vertices:
        nonlocal_vertices.append(
            sp.NonLocalVertex(
                name=spec["name"],
                order=int(spec["order"]),
                coupling=_as_coupling(spec),
                coupling_vectorized=bool(spec.get("coupling_vectorized", False)),
                equal_time=bool(spec.get("equal_time", False)),
                already_R_contracted=bool(
                    spec.get("already_R_contracted", False)
                ),
            )
        )

    return System(
        field=sp.FieldSpec(cfg.field_name, n_components=cfg.n_components),
        linear=linear,
        noise=noise,
        vertices=tuple(local_vertices),
        nonlocal_vertices=tuple(nonlocal_vertices),
        t_min=cfg.t_min,
    )



def _build_noise(d: dict, base_dir: Path | None = None):
    """Lower the ``system.noise`` mapping to ``sp.GaussianNoise``.

    ``kappa2`` is required and selects one of three constructions through
    its ``type``; ``sigma2`` is optional and its ``type`` defaults to
    ``'constant'``.  The ``callable_module`` variants resolve their
    ``module`` path against ``base_dir``.

    Raises:
        ValueError: for an unsupported ``type``, or for a
            ``callable_module`` spec that lacks ``base_dir`` or ``module``.
    """
    from . import specs as sp

    # --- kappa2 ----------------------------------------------------------
    kappa_spec = dict(d["kappa2"])
    kappa_kind = kappa_spec.pop("type")
    if kappa_kind == "separable_translation":
        kappa2 = sp.SeparableTranslation(
            temporal=_build_kernel(kappa_spec["temporal"], axis="time"),
            spatial=_build_kernel(kappa_spec["spatial"], axis="space"),
        )
    elif kappa_kind == "separable_rotation":
        kappa2 = sp.SeparableRotation(
            temporal=_build_kernel(kappa_spec["temporal"], axis="time"),
            angular=_build_kernel(kappa_spec["angular"], axis="angular"),
        )
    elif kappa_kind == "callable_module":
        if base_dir is None:
            raise ValueError(
                "noise.kappa2.type='callable_module' requires base_dir; "
                "the workflow loader should pass it through."
            )
        if "module" not in kappa_spec:
            raise ValueError(
                "noise.kappa2.type='callable_module' requires "
                "'module: <relative path to .py file>'."
            )
        kappa_file = (base_dir / kappa_spec.pop("module")).resolve()
        kappa_attr = kappa_spec.pop("attr", "kappa2")
        kappa2 = sp.GeneralKappa2(
            fn=_load_callable_from_module(kappa_file, kappa_attr)
        )
    else:
        raise ValueError(
            f"Unsupported kappa2.type {kappa_kind!r}.  Supported: "
            f"'separable_translation', 'separable_rotation', 'callable_module'."
        )

    # --- sigma2 (optional) -----------------------------------------------
    sigma_spec = d.get("sigma2")
    if sigma_spec is None:
        return sp.GaussianNoise(kappa2=kappa2, sigma2=None)

    sigma_kind = dict(sigma_spec).get("type", "constant")
    if sigma_kind == "constant":
        sigma2 = sp.ConstantImpulse(
            amplitude=sigma_spec.get("amplitude", 0.0)
        )
    elif sigma_kind == "callable_module":
        if base_dir is None:
            raise ValueError(
                "noise.sigma2.type='callable_module' requires base_dir; "
                "the workflow loader should pass it through."
            )
        if "module" not in sigma_spec:
            raise ValueError(
                "noise.sigma2.type='callable_module' requires "
                "'module: <relative path to .py file>'."
            )
        sigma_file = (base_dir / sigma_spec["module"]).resolve()
        sigma_attr = sigma_spec.get("attr", "sigma2")
        sigma2 = sp.CustomImpulse(
            fn=_load_callable_from_module(sigma_file, sigma_attr)
        )
    else:
        raise ValueError(
            f"Unsupported sigma2.type {sigma_kind!r}.  Supported: "
            f"'constant', 'callable_module'."
        )

    return sp.GaussianNoise(kappa2=kappa2, sigma2=sigma2)


def _build_kernel(d: dict, axis: str):
    """Build the kernel spec object for one axis of a separable kappa2.

    ``axis`` is ``"time"``, ``"space"`` or ``"angular"``; the kernel's
    ``type`` defaults to ``"exponential"``.

    Raises:
        ValueError: if the (axis, type) combination is not supported.
    """
    from . import specs as sp

    kind = d.get("type", "exponential")
    is_exponential = kind == "exponential"
    is_gaussian = kind == "gaussian"

    if axis == "time" and (is_exponential or is_gaussian):
        temporal_cls = (
            sp.ExponentialTemporal if is_exponential else sp.GaussianTemporal
        )
        return temporal_cls(lam=d["lam"], sigma_t=d["sigma_t"])

    if axis == "space" and (is_exponential or is_gaussian):
        spatial_cls = (
            sp.ExponentialSpatial if is_exponential else sp.GaussianSpatial
        )
        return spatial_cls(sigma_x=d["sigma_x"])

    if axis == "angular" and kind == "legendre":
        return sp.LegendreAngular(coeffs=list(d["coeffs"]))

    raise ValueError(
        f"Unsupported {axis}-kernel type {kind!r}."
    )


# =========================================================================
# Full runner
# =========================================================================



[docs]
def run_workflow(cfg: WorkflowConfig):
    """Run the whole pipeline: build the system, expand, build the
    propagators, sweep, then emit every configured output.

    Returns ``(sweep, totals_dataframe)`` for programmatic use.

    Raises:
        ValueError: if both ``expand.n_jobs`` and ``sweep.n_jobs`` differ
            from 1.
    """
    system = build_system(cfg.system)
    expand_cfg = cfg.expand
    prop_cfg = cfg.propagators

    # ``propagators.diag_C`` is the user-facing switch for "is C
    # diagonal?". With it off, the closed-form C yields a full (N, N)
    # matrix per sample, whereas a symbolic expansion run with
    # ``diag_C=True`` would collapse the observable (a, b) index pair
    # through ``KroneckerDelta(a, b)`` and zero every cross-component pair
    # at order 0. So when the propagator side opts into off-diagonal C,
    # the expansion is switched to ``diag_C=False`` automatically and the
    # user does not have to set the knob twice.
    force_full_c = (not prop_cfg.diag_C) and expand_cfg.diag_C
    symbolic_diag_c = False if force_full_c else expand_cfg.diag_C

    expansion = system.expand(
        observable=expand_cfg.observable,
        orders=expand_cfg.orders,
        response_phase=expand_cfg.response_phase,
        ito=expand_cfg.ito,
        collect_topology=expand_cfg.collect_topology,
        iso_R=expand_cfg.iso_R,
        diag_R=expand_cfg.diag_R,
        diag_C=symbolic_diag_c,
        iso_C=expand_cfg.iso_C,
        cache_path=expand_cfg.cache_path,
    )

    # The optional closed-form C callable comes from a user ``.py`` file.
    # ``_load_c_closed_form`` registers that module under the file's bare
    # stem and exposes its directory on ``sys.path`` / ``PYTHONPATH`` so
    # that joblib loky subprocesses can use it, which is what allows
    # parallel C-table builds (``propagators.n_jobs: -1``).
    closed_form_c = _load_c_closed_form(prop_cfg)
    props = system.propagators(
        t_max=prop_cfg.t_max,
        n_grid_t=prop_cfg.n_grid_t,
        homogeneity=prop_cfg.homogeneity,
        r_max=prop_cfg.r_max,
        n_grid_r=prop_cfg.n_grid_r,
        n_grid_cos=prop_cfg.n_grid_cos,
        x_max=prop_cfg.x_max,
        n_grid_x=prop_cfg.n_grid_x,
        n_jobs=prop_cfg.n_jobs,
        c_closed_form=closed_form_c,
        cache_path=prop_cfg.cache_path,
        interp_method=prop_cfg.interp_method,
        c_closed_form_only=prop_cfg.c_closed_form_only,
        c_closed_form_vectorized=prop_cfg.c_closed_form_vectorized,
        c_method=prop_cfg.c_method,
        c_n_gauss=prop_cfg.c_n_gauss,
        diag_C=prop_cfg.diag_C,
    )

    # The two parallelism layers are mutually exclusive because joblib's
    # loky backend cannot nest process pools. ``sweep.n_jobs``
    # parallelises over grid points and goes to ``expansion.sweep`` as
    # ``n_jobs``; ``expand.n_jobs`` parallelises over diagrams within one
    # grid point and goes in as ``evaluate_n_jobs``. At least one of them
    # has to stay at 1.
    sweep_cfg = cfg.sweep
    if not (int(expand_cfg.n_jobs) == 1 or int(sweep_cfg.n_jobs) == 1):
        raise ValueError(
            "Specify exactly one of {expand.n_jobs > 1, sweep.n_jobs > 1}; "
            "nested joblib loky pools are not supported."
        )

    sweep = expansion.sweep(
        props,
        positions_grid=sweep_cfg.positions_grid,
        t_final_grid=sweep_cfg.t_final_grid,
        component_pairs=sweep_cfg.component_pairs,
        orders=sweep_cfg.orders,
        vertex_types=sweep_cfg.vertex_types,
        integrate_over=sweep_cfg.integrate_over,
        method=sweep_cfg.method,
        n_samples=sweep_cfg.n_samples,
        seed=sweep_cfg.seed,
        n_jobs=sweep_cfg.n_jobs,
        evaluate_n_jobs=expand_cfg.n_jobs,
        n_gauss=sweep_cfg.n_gauss,
    )

    totals = sweep.totals()
    for output_spec in cfg.output:
        _emit_output(output_spec, sweep, totals)

    return sweep, totals



def _load_c_closed_form(cfg: PropagatorsConfig):
    """Import a user-supplied ``C_fn(n1, t1, n2, t2)`` from the
    ``.py`` file given by ``c_closed_form_module`` in the config.

    Returns ``None`` if the field isn't set.
    """
    if cfg.c_closed_form_module is None:
        return None
    path = Path(cfg.c_closed_form_module).resolve()

    # Register the module under its file basename and put the parent on
    # sys.path AND PYTHONPATH so that joblib loky workers can re-import
    # it when receiving tasks during parallel C-table builds, integration,
    # or sweep dispatch. See ``_load_callable_from_module`` for the same
    # pattern applied to coupling / gamma callables.
    parent_dir = str(path.parent)
    if parent_dir not in sys.path:
        sys.path.append(parent_dir)
    pp = os.environ.get("PYTHONPATH", "")
    pp_parts = pp.split(os.pathsep) if pp else []
    if parent_dir not in pp_parts:
        os.environ["PYTHONPATH"] = os.pathsep.join([parent_dir, *pp_parts])
    module_name = path.stem

    spec_obj = importlib.util.spec_from_file_location(module_name, path)
    if spec_obj is None or spec_obj.loader is None:
        raise ImportError(
            f"Cannot load c_closed_form_module {path!r}."
        )
    module = importlib.util.module_from_spec(spec_obj)
    sys.modules[module_name] = module
    spec_obj.loader.exec_module(module)
    fn = getattr(module, cfg.c_closed_form_attr, None)
    if fn is None:
        raise AttributeError(
            f"Module {path!r} has no attribute "
            f"{cfg.c_closed_form_attr!r}."
        )
    _register_module_by_value(module)
    return fn


def _emit_output(out: OutputConfig, sweep, totals) -> None:
    if out.type == "table":
        payload = _format_table(totals, out.format)
        _write_or_print(payload, out.path)
    elif out.type == "npz":
        if out.path is None:
            raise ValueError("output type 'npz' requires a 'path'.")
        np.savez(
            out.path,
            **{col: totals[col].to_numpy() for col in totals.columns},
        )
    elif out.type == "plot":
        if out.path is None:
            raise ValueError("output type 'plot' requires a 'path'.")
        if out.x is None:
            raise ValueError("output type 'plot' requires 'x'.")
        fig = sweep.plot(
            x=out.x, y=out.y, hue=out.hue, facet_col=out.facet_col,
        )
        fig.savefig(out.path, dpi=120, bbox_inches="tight")


def _format_table(df, fmt: str) -> str:
    if fmt == "markdown":
        return df.to_markdown(index=False)
    if fmt == "csv":
        return df.to_csv(index=False)
    if fmt == "plain":
        return df.to_string(index=False)
    raise ValueError(
        f"output.format must be 'markdown', 'csv', or 'plain'; got {fmt!r}."
    )


def _write_or_print(payload: str, path: Any) -> None:
    if path is None:
        print(payload)
    else:
        Path(path).parent.mkdir(parents=True, exist_ok=True)
        Path(path).write_text(payload)