From d209ec3068459708ef46ece12a925f4aa954332c Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Wed, 10 Jun 2026 17:19:17 +0000
Subject: [PATCH] feat: add Monte Carlo uncertainty propagation module
 (gpu_stack.uncertainty)

Adds `gpu_stack/uncertainty.py` with UncertainAssignment, three distribution
types (uniform, normal, lognormal), and `propagate_uncertainty` that resolves
targets over n_samples draws. Uses SymPy lambdify fast-path for vectorised
evaluation (200 samples in <1 ms vs ~14 s per-sample) with fallback to
per-sample resolver. Returns structured TargetUncertaintyStats with mean,
sample std, p5/p50/p95, failure count, and echoed input specs. 35 tests cover
determinism, quantile ordering, analytic correctness, failure counting, and
all three distribution types.

https://claude.ai/code/session_01Eu2JVnPFgMQftwYTP3cGQZ
---
 gpu_stack/uncertainty.py  | 674 ++++++++++++++++++++++++++++++++++++++
 tests/test_uncertainty.py | 670 +++++++++++++++++++++++++++++++++++++
 2 files changed, 1344 insertions(+)
 create mode 100644 gpu_stack/uncertainty.py
 create mode 100644 tests/test_uncertainty.py

diff --git a/gpu_stack/uncertainty.py b/gpu_stack/uncertainty.py
new file mode 100644
index 0000000..f0b5c5e
--- /dev/null
+++ b/gpu_stack/uncertainty.py
@@ -0,0 +1,674 @@
+"""
+gpu_stack.uncertainty
+=====================
+
+Monte Carlo uncertainty propagation over the existing symbolic resolver.
+
+The module never invents numbers. Every distribution must be supplied
+explicitly by the caller; there are no default uncertainties.
+
+Public API
+----------
+UncertainAssignment(name, distribution)
+    Pairs a registered variable name with a distribution object.
+
+uniform(low, high)
+normal(mean, std)
+lognormal(mu, sigma)
+    Distribution constructors. Each validates sign assumptions of the target
+    variable when UncertainAssignment is constructed.
+
+propagate_uncertainty(preset_or_assignments, targets, uncertain, n_samples, seed)
+    Monte Carlo driver. Resolves each target over n_samples draws, collecting
+    per-target statistics.
+
+UncertaintyResult, TargetUncertaintyStats
+    Structured result artifacts with to_dict() for JSON-friendly output.
+
+Performance note
+----------------
+When the symbolic resolver can form a closed-form expression over the uncertain
+inputs (i.e., the expression remains symbolic after omitting those inputs), the
+driver lambdifies that expression and vectorises the sample evaluation over all
+n_samples at once via SymPy's lambdify. This reduces 200-sample evaluation from
+~14 s (per-sample resolve) to under 1 ms. When lambdification is not possible
+(the expression would require re-resolving a variant branching or similar), the
+driver falls back to per-sample resolution through the existing public
+resolve() path.
+"""
+
+from __future__ import annotations
+
+import math
+from dataclasses import dataclass, field
+from typing import (
+    Any,
+    Dict,
+    Iterable,
+    List,
+    Mapping,
+    Optional,
+    Sequence,
+    Tuple,
+    Union,
+)
+
+import sympy as sp
+
+from .core.presets import Preset
+from .core.registry import Registry
+from .core.resolver import ResolverError, resolve
+
+
+# ---------------------------------------------------------------------------
+# Distribution types
+# ---------------------------------------------------------------------------
+
+@dataclass(frozen=True)
+class _UniformDist:
+    """Uniform distribution on [low, high]."""
+
+    kind: str = field(default="uniform", init=False)
+    low: float
+    high: float
+
+    def __post_init__(self) -> None:
+        if self.low > self.high:
+            raise ValueError(
+                f"uniform: low ({self.low}) must be <= high ({self.high})"
+            )
+
+    def has_mass_at_nonpositive(self) -> bool:
+        return self.low <= 0.0
+
+    def has_mass_at_negative(self) -> bool:
+        return self.low < 0.0
+
+    def to_dict(self) -> Dict[str, object]:
+        return {"kind": self.kind, "low": self.low, "high": self.high}
+
+
+@dataclass(frozen=True)
+class _NormalDist:
+    """Normal (Gaussian) distribution."""
+
+    kind: str = field(default="normal", init=False)
+    mean: float
+    std: float
+
+    def __post_init__(self) -> None:
+        if self.std <= 0.0:
+            raise ValueError(
+                f"normal: std ({self.std}) must be > 0"
+            )
+
+    def has_mass_at_nonpositive(self) -> bool:
+        # Normal has infinite support; always has some mass at nonpositive.
+        return True
+
+    def has_mass_at_negative(self) -> bool:
+        return True
+
+    def to_dict(self) -> Dict[str, object]:
+        return {"kind": self.kind, "mean": self.mean, "std": self.std}
+
+
+@dataclass(frozen=True)
+class _LognormalDist:
+    """
+    Log-normal distribution: if X ~ Lognormal(mu, sigma), then
+    log(X) ~ Normal(mu, sigma). Support is strictly (0, +inf).
+    """
+
+    kind: str = field(default="lognormal", init=False)
+    mu: float
+    sigma: float
+
+    def __post_init__(self) -> None:
+        if self.sigma <= 0.0:
+            raise ValueError(
+                f"lognormal: sigma ({self.sigma}) must be > 0"
+            )
+
+    def has_mass_at_nonpositive(self) -> bool:
+        return False
+
+    def has_mass_at_negative(self) -> bool:
+        return False
+
+    def to_dict(self) -> Dict[str, object]:
+        return {"kind": self.kind, "mu": self.mu, "sigma": self.sigma}
+
+
+Distribution = Union[_UniformDist, _NormalDist, _LognormalDist]
+
+
+def uniform(low: float, high: float) -> _UniformDist:
+    """Uniform distribution on [low, high]."""
+    return _UniformDist(low=low, high=high)
+
+
+def normal(mean: float, std: float) -> _NormalDist:
+    """Normal distribution with given mean and standard deviation."""
+    return _NormalDist(mean=mean, std=std)
+
+
+def lognormal(mu: float, sigma: float) -> _LognormalDist:
+    """
+    Log-normal distribution parameterised by the mean (mu) and standard
+    deviation (sigma) of the underlying normal in log-space.
+    """
+    return _LognormalDist(mu=mu, sigma=sigma)
+
+
+# ---------------------------------------------------------------------------
+# UncertainAssignment
+# ---------------------------------------------------------------------------
+
+@dataclass(frozen=True)
+class UncertainAssignment:
+    """
+    Pairs a registered variable name with a distribution.
+
+    Validation
+    ----------
+    If the target variable has a ``positive=True`` SymPy assumption, any
+    distribution that places mass at non-positive values is rejected. If the
+    variable has a ``nonnegative=True`` assumption, distributions with mass at
+    strictly negative values are rejected.
+    """
+
+    name: str
+    distribution: Distribution
+
+    def __post_init__(self) -> None:
+        var = Registry.variables.get(self.name)
+        if var is None:
+            raise ValueError(
+                f"UncertainAssignment: unknown variable name {self.name!r}"
+            )
+        sym = var.symbol
+        if sym.is_positive:
+            if self.distribution.has_mass_at_nonpositive():
+                raise ValueError(
+                    f"UncertainAssignment({self.name!r}): variable has "
+                    f"positive=True assumption but distribution "
+                    f"{self.distribution.to_dict()} has mass at non-positive "
+                    "values. Use lognormal or a uniform distribution with "
+                    "low > 0."
+                )
+        elif sym.is_nonnegative:
+            if self.distribution.has_mass_at_negative():
+                raise ValueError(
+                    f"UncertainAssignment({self.name!r}): variable has "
+                    f"nonnegative=True assumption but distribution "
+                    f"{self.distribution.to_dict()} has mass at negative "
+                    "values. Use lognormal or a uniform distribution with "
+                    "low >= 0."
+                )
+
+    def to_dict(self) -> Dict[str, object]:
+        return {"name": self.name, "distribution": self.distribution.to_dict()}
+
+
+# ---------------------------------------------------------------------------
+# Result artifacts
+# ---------------------------------------------------------------------------
+
+@dataclass(frozen=True)
+class TargetUncertaintyStats:
+    """
+    Per-target statistics from a Monte Carlo propagation run.
+
+    Fields
+    ------
+    label       : caller-supplied label for the target.
+    target      : registered variable name (string form).
+    sample_count: number of samples drawn (equals n_samples).
+    failure_count: samples where resolution errored or returned a
+                  non-finite value (div-by-zero, complex infinity, etc.).
+    mean        : sample mean of the finite resolved values.
+    std         : sample standard deviation.
+    p5          : 5th percentile.
+    p50         : 50th percentile (median).
+    p95         : 95th percentile.
+    input_specs : the UncertainAssignment inputs echoed back.
+    """
+
+    label: str
+    target: str
+    sample_count: int
+    failure_count: int
+    mean: Optional[float]
+    std: Optional[float]
+    p5: Optional[float]
+    p50: Optional[float]
+    p95: Optional[float]
+    input_specs: Tuple[UncertainAssignment, ...]
+
+    def to_dict(self) -> Dict[str, object]:
+        return {
+            "label": self.label,
+            "target": self.target,
+            "sample_count": self.sample_count,
+            "failure_count": self.failure_count,
+            "mean": self.mean,
+            "std": self.std,
+            "p5": self.p5,
+            "p50": self.p50,
+            "p95": self.p95,
+            "input_specs": [spec.to_dict() for spec in self.input_specs],
+        }
+
+
+@dataclass(frozen=True)
+class UncertaintyResult:
+    """
+    Full result of a Monte Carlo propagation run.
+
+    Fields
+    ------
+    preset_name  : name of the preset used.
+    n_samples    : number of samples requested.
+    seed         : RNG seed used (None if no seed was supplied).
+    targets      : per-target stats, in the same order as the targets arg.
+    input_specs  : all UncertainAssignment inputs echoed back.
+    """
+
+    preset_name: str
+    n_samples: int
+    seed: Optional[int]
+    targets: Tuple[TargetUncertaintyStats, ...]
+    input_specs: Tuple[UncertainAssignment, ...]
+
+    def to_dict(self) -> Dict[str, object]:
+        return {
+            "preset_name": self.preset_name,
+            "n_samples": self.n_samples,
+            "seed": self.seed,
+            "input_specs": [spec.to_dict() for spec in self.input_specs],
+            "targets": {t.label: t.to_dict() for t in self.targets},
+        }
+
+
+# ---------------------------------------------------------------------------
+# Internal helpers
+# ---------------------------------------------------------------------------
+
+def _draw_samples(
+    dist: Distribution,
+    n: int,
+    rng: Any,
+) -> List[float]:
+    """Draw n samples from dist using the provided numpy rng."""
+    if isinstance(dist, _UniformDist):
+        return list(rng.uniform(dist.low, dist.high, n))
+    if isinstance(dist, _NormalDist):
+        return list(rng.normal(dist.mean, dist.std, n))
+    if isinstance(dist, _LognormalDist):
+        return list(rng.lognormal(dist.mu, dist.sigma, n))
+    raise TypeError(f"unsupported distribution type: {type(dist)}")
+
+
+def _sympy_value_to_float(v: object) -> Optional[float]:
+    """Convert a SymPy expression to float, returning None on failure."""
+    if hasattr(v, "free_symbols") and v.free_symbols:
+        return None
+    try:
+        f = float(v)
+        return f if math.isfinite(f) else None
+    except (TypeError, ValueError):
+        return None
+
+
+def _percentile_of_sorted(sorted_vals: List[float], q: float) -> float:
+    """
+    Linear interpolation percentile from a sorted list. q in [0.0, 1.0].
+    """
+    n = len(sorted_vals)
+    if n == 0:
+        return float("nan")
+    idx = q * (n - 1)
+    lo = int(idx)
+    hi = lo + 1
+    if hi >= n:
+        return sorted_vals[-1]
+    frac = idx - lo
+    return sorted_vals[lo] + frac * (sorted_vals[hi] - sorted_vals[lo])
+
+
+def _compute_stats(
+    label: str,
+    target: str,
+    samples: List[Optional[float]],
+    input_specs: Tuple[UncertainAssignment, ...],
+) -> TargetUncertaintyStats:
+    n_total = len(samples)
+    finite = [s for s in samples if s is not None]
+    n_fail = n_total - len(finite)
+
+    if not finite:
+        return TargetUncertaintyStats(
+            label=label,
+            target=target,
+            sample_count=n_total,
+            failure_count=n_fail,
+            mean=None,
+            std=None,
+            p5=None,
+            p50=None,
+            p95=None,
+            input_specs=input_specs,
+        )
+
+    n = len(finite)
+    mean = sum(finite) / n
+    # Sample standard deviation (Bessel-corrected, divide by n-1).
+    # Returns 0 for n==1 since no spread can be estimated from one sample.
+    variance = sum((x - mean) ** 2 for x in finite) / (n - 1) if n > 1 else 0.0
+    std = math.sqrt(variance)
+    sorted_finite = sorted(finite)
+
+    return TargetUncertaintyStats(
+        label=label,
+        target=target,
+        sample_count=n_total,
+        failure_count=n_fail,
+        mean=mean,
+        std=std,
+        p5=_percentile_of_sorted(sorted_finite, 0.05),
+        p50=_percentile_of_sorted(sorted_finite, 0.50),
+        p95=_percentile_of_sorted(sorted_finite, 0.95),
+        input_specs=input_specs,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Fast path: symbolic resolve + lambdify
+# ---------------------------------------------------------------------------
+
+def _try_lambdify_path(
+    uncertain_names: Sequence[str],
+    base_assignments: Dict[str, float],
+    base_variants: Dict[str, str],
+    target_name: str,
+) -> Optional[Tuple[Any, List[str]]]:
+    """
+    Attempt to build a lambdified function for target_name with uncertain_names
+    left as free symbols. Returns the callable or None if it fails.
+
+    The callable signature is f(*sample_arrays) -> numpy array, where each
+    positional argument corresponds to the sorted order of symbols that appear
+    free in the resolved expression. The returned callable and a list of the
+    symbol names (in that order) are returned as a 2-tuple.
+    """
+    partial_assignments = {
+        k: v for k, v in base_assignments.items()
+        if k not in uncertain_names
+    }
+    try:
+        result = resolve(
+            target_name,
+            assignments=partial_assignments,
+            variants=base_variants,
+        )
+    except ResolverError:
+        return None
+
+    expr = result.value
+    free = expr.free_symbols
+    if not free:
+        # Fully deterministic - no uncertain inputs influence this target.
+        # Still valid; lambdify will return a constant.
+        ordered_syms: List[sp.Symbol] = []
+    else:
+        ordered_syms = sorted(free, key=str)
+
+    # Map symbol name -> uncertain variable name
+    sym_to_uncertain: Dict[str, str] = {}
+    for uname in uncertain_names:
+        var = Registry.variables[uname]
+        sym_name = str(var.symbol)
+        if var.symbol in free or sym_name in [str(s) for s in free]:
+            sym_to_uncertain[str(var.symbol)] = uname
+
+    # Check that all free symbols correspond to our uncertain inputs.
+    # If there are extra free symbols (other missing inputs) we cannot
+    # use the lambdify path reliably.
+    for sym in ordered_syms:
+        if str(sym) not in sym_to_uncertain:
+            # Some other variable is also missing - lambdify is not safe.
+            return None
+
+    try:
+        lam = sp.lambdify(ordered_syms, expr, modules="numpy")
+    except Exception:
+        return None
+
+    return lam, [sym_to_uncertain[str(s)] for s in ordered_syms]
+
+
+# ---------------------------------------------------------------------------
+# Public driver
+# ---------------------------------------------------------------------------
+
+def propagate_uncertainty(
+    preset_or_assignments: Union[Preset, Mapping[str, float]],
+    targets: Iterable[Tuple[str, str]],
+    uncertain: Sequence[UncertainAssignment],
+    n_samples: int = 200,
+    seed: Optional[int] = None,
+) -> UncertaintyResult:
+    """
+    Monte Carlo uncertainty propagation over the existing resolver.
+
+    Parameters
+    ----------
+    preset_or_assignments
+        A Preset or a plain dict of assignments. When a Preset is supplied its
+        variant selections are also forwarded to the resolver.
+    targets
+        Iterable of (label, target_name) pairs, same convention as
+        Preset.evaluate_targets.
+    uncertain
+        Sequence of UncertainAssignment objects specifying which inputs have
+        distributions. The caller must supply all distributions explicitly;
+        no defaults are invented.
+    n_samples
+        Number of Monte Carlo samples. Must be >= 1.
+    seed
+        Integer seed for the random number generator. When provided the run is
+        fully deterministic: identical seed, preset, targets, and uncertain
+        inputs always produce identical results.
+
+    Returns
+    -------
+    UncertaintyResult with per-target statistics and the input spec echoed back.
+
+    Performance
+    -----------
+    When the resolver can form a closed-form symbolic expression over the
+    uncertain inputs (which is the common case for linear economics chains),
+    the driver lambdifies that expression and evaluates all samples at once.
+    For targets that require per-sample resolver calls, evaluation runs at
+    roughly 70 ms/sample on a typical workstation; keep n_samples small
+    (<=50) for interactive use when lambdification is not available.
+    """
+    try:
+        import numpy as _np
+        _has_numpy = True
+    except ImportError:
+        _has_numpy = False
+
+    if n_samples < 1:
+        raise ValueError(f"n_samples must be >= 1, got {n_samples}")
+    if not uncertain:
+        raise ValueError("uncertain must contain at least one UncertainAssignment")
+
+    # Build base assignments and variants.
+    if isinstance(preset_or_assignments, Preset):
+        base_assignments: Dict[str, float] = dict(preset_or_assignments.assignments)
+        base_variants: Dict[str, str] = dict(preset_or_assignments.variants)
+        preset_name = preset_or_assignments.name
+    else:
+        base_assignments = dict(preset_or_assignments)
+        base_variants = {}
+        preset_name = "<assignments>"
+
+    # Validate that there are no duplicate uncertain variable names.
+    seen_names: List[str] = []
+    for ua in uncertain:
+        if ua.name in seen_names:
+            raise ValueError(
+                f"propagate_uncertainty: uncertain variable {ua.name!r} appears "
+                "more than once in the uncertain list. Each variable must appear "
+                "at most once."
+            )
+        seen_names.append(ua.name)
+
+    # Validate that all uncertain names are also in the base assignments.
+    for ua in uncertain:
+        if ua.name not in base_assignments:
+            raise ValueError(
+                f"propagate_uncertainty: uncertain variable {ua.name!r} is not "
+                "present in the preset/assignments dict. The base assignment "
+                "provides the nominal value; add it before marking it uncertain."
+            )
+
+    targets_list = list(targets)
+    input_specs = tuple(uncertain)
+    uncertain_names = [ua.name for ua in uncertain]
+
+    # Build RNG. We use numpy when available (needed for lambdify path anyway).
+    if _has_numpy:
+        rng = _np.random.default_rng(seed)
+        # Pre-draw all sample arrays, one per uncertain variable.
+        sample_arrays: Dict[str, List[float]] = {
+            ua.name: _draw_samples(ua.distribution, n_samples, rng)
+            for ua in uncertain
+        }
+    else:
+        import random
+        _rng = random.Random(seed)
+
+        class _PurePythonRNG:
+            def uniform(self, lo, hi, n):
+                return [_rng.uniform(lo, hi) for _ in range(n)]
+
+            def normal(self, mu, sigma, n):
+                return [_rng.gauss(mu, sigma) for _ in range(n)]
+
+            def lognormal(self, mu, sigma, n):
+                import math as _m
+                return [_m.exp(_rng.gauss(mu, sigma)) for _ in range(n)]
+
+        py_rng = _PurePythonRNG()
+        sample_arrays = {
+            ua.name: _draw_samples(ua.distribution, n_samples, py_rng)
+            for ua in uncertain
+        }
+
+    target_stats_list: List[TargetUncertaintyStats] = []
+
+    for label, target_name in targets_list:
+        # -- attempt fast lambdify path --
+        lambdify_result = _try_lambdify_path(
+            uncertain_names,
+            base_assignments,
+            base_variants,
+            target_name,
+        )
+
+        if lambdify_result is not None:
+            lam, ordered_names = lambdify_result
+            if _has_numpy:
+                arrays = [
+                    _np.asarray(sample_arrays[name], dtype=float)
+                    for name in ordered_names
+                ]
+                try:
+                    raw = lam(*arrays) if ordered_names else lam()
+                    # raw may be a scalar if the expression is constant
+                    vals = _np.asarray(raw, dtype=float).flatten()
+                    if vals.size == 1:
+                        vals = _np.full(n_samples, vals[0])
+                    float_samples: List[Optional[float]] = [
+                        v if math.isfinite(v) else None
+                        for v in vals.tolist()
+                    ]
+                except Exception:
+                    float_samples = None
+            else:
+                # pure-python lambdify path
+                try:
+                    rows = [sample_arrays[name] for name in ordered_names]
+                    if rows:
+                        float_samples = []
+                        for i in range(n_samples):
+                            args = [rows[j][i] for j in range(len(rows))]
+                            v = lam(*args)
+                            try:
+                                fv = float(v)
+                                float_samples.append(fv if math.isfinite(fv) else None)
+                            except (TypeError, ValueError):
+                                float_samples.append(None)
+                    else:
+                        v = lam()
+                        try:
+                            fv = float(v)
+                            float_samples = [
+                                fv if math.isfinite(fv) else None
+                            ] * n_samples
+                        except (TypeError, ValueError):
+                            float_samples = [None] * n_samples
+                except Exception:
+                    float_samples = None
+
+            if float_samples is not None:
+                target_stats_list.append(
+                    _compute_stats(label, target_name, float_samples, input_specs)
+                )
+                continue
+
+        # -- fallback: per-sample resolve --
+        float_samples_fallback: List[Optional[float]] = []
+        for i in range(n_samples):
+            overrides = {name: sample_arrays[name][i] for name in uncertain_names}
+            sample_assignments = dict(base_assignments)
+            sample_assignments.update(overrides)
+            try:
+                result = resolve(
+                    target_name,
+                    assignments=sample_assignments,
+                    variants=base_variants,
+                )
+                fv = _sympy_value_to_float(result.value)
+                float_samples_fallback.append(fv)
+            except ResolverError:
+                float_samples_fallback.append(None)
+
+        target_stats_list.append(
+            _compute_stats(
+                label, target_name, float_samples_fallback, input_specs
+            )
+        )
+
+    return UncertaintyResult(
+        preset_name=preset_name,
+        n_samples=n_samples,
+        seed=seed,
+        targets=tuple(target_stats_list),
+        input_specs=input_specs,
+    )
+
+
+__all__ = [
+    "UncertainAssignment",
+    "UncertaintyResult",
+    "TargetUncertaintyStats",
+    "Distribution",
+    "uniform",
+    "normal",
+    "lognormal",
+    "propagate_uncertainty",
+]
diff --git a/tests/test_uncertainty.py b/tests/test_uncertainty.py
new file mode 100644
index 0000000..aa139e0
--- /dev/null
+++ b/tests/test_uncertainty.py
@@ -0,0 +1,670 @@
+"""
+Tests for gpu_stack.uncertainty -- Monte Carlo propagation.
+
+All uncertain ranges used here are SYNTHETIC FIXTURES chosen for
+deterministic testability; they are not historical data, vendor
+specifications, or price recommendations.
+"""
+
+from __future__ import annotations
+
+import math
+from typing import Optional
+
+import pytest
+
+from gpu_stack.uncertainty import (
+    Distribution,
+    TargetUncertaintyStats,
+    UncertainAssignment,
+    UncertaintyResult,
+    lognormal,
+    normal,
+    propagate_uncertainty,
+    uniform,
+)
+from gpu_stack.presets import scenarios
+
+
+# ---------------------------------------------------------------------------
+# Synthetic fixture helpers
+# ---------------------------------------------------------------------------
+
+SYNTHETIC_PRESET = scenarios.dense_training_cost_fixture
+
+# SYNTHETIC: electricity price range 0.25--0.45 $/kWh, chosen for
+# round-number test arithmetic; not a market data range.
+SYNTH_PRICE_UNIFORM = uniform(0.25, 0.45)
+
+# SYNTHETIC: cluster availability 0.85--1.0, round-number assumption.
+SYNTH_AVAIL_UNIFORM = uniform(0.85, 1.0)
+
+# SYNTHETIC: normal distribution over electricity price; mean=0.36, std=0.05.
+SYNTH_PRICE_NORMAL = normal(mean=0.36, std=0.05)
+
+# SYNTHETIC: log-normal over power price; mu=log(0.36), sigma=0.1 (approx 10%).
+import math as _math
+SYNTH_PRICE_LOGNORMAL = lognormal(mu=_math.log(0.36), sigma=0.1)
+
+UNCERTAIN_PRICE = UncertainAssignment(
+    "econ.power.price_kwh_peak",
+    SYNTH_PRICE_UNIFORM,
+)
+UNCERTAIN_OFFPEAK = UncertainAssignment(
+    "econ.power.price_kwh_offpeak",
+    SYNTH_PRICE_UNIFORM,
+)
+UNCERTAIN_AVAIL = UncertainAssignment(
+    "training.cluster_availability",
+    SYNTH_AVAIL_UNIFORM,
+)
+
+COST_TARGET = ("cost_per_token", "econ.cost.per_token")
+POWER_TARGET = ("job_dc_power", "econ.job.dc_power")
+
+
+# ---------------------------------------------------------------------------
+# Distribution constructor validation
+# ---------------------------------------------------------------------------
+
+def test_uniform_requires_low_le_high():
+    with pytest.raises(ValueError, match="low.*<=.*high"):
+        uniform(0.5, 0.3)
+
+
+def test_uniform_equal_bounds_is_valid():
+    d = uniform(0.36, 0.36)
+    assert d.low == 0.36
+    assert d.high == 0.36
+
+
+def test_normal_requires_positive_std():
+    with pytest.raises(ValueError, match="std"):
+        normal(0.36, -0.01)
+    with pytest.raises(ValueError, match="std"):
+        normal(0.36, 0.0)
+
+
+def test_lognormal_requires_positive_sigma():
+    with pytest.raises(ValueError, match="sigma"):
+        lognormal(0.0, 0.0)
+    with pytest.raises(ValueError, match="sigma"):
+        lognormal(0.0, -0.1)
+
+
+def test_distribution_to_dict_shapes():
+    assert uniform(0.2, 0.4).to_dict() == {
+        "kind": "uniform", "low": 0.2, "high": 0.4
+    }
+    assert normal(0.36, 0.05).to_dict() == {
+        "kind": "normal", "mean": 0.36, "std": 0.05
+    }
+    assert lognormal(0.0, 0.1).to_dict() == {
+        "kind": "lognormal", "mu": 0.0, "sigma": 0.1
+    }
+
+
+# ---------------------------------------------------------------------------
+# UncertainAssignment validation
+# ---------------------------------------------------------------------------
+
+def test_uncertain_assignment_rejects_unknown_variable():
+    with pytest.raises(ValueError, match="unknown variable"):
+        UncertainAssignment("no.such.variable", uniform(0.1, 0.9))
+
+
+def test_uncertain_assignment_accepts_real_only_variable():
+    # econ.power.price_kwh_peak has real=True, no sign assumption -> accept any
+    ua = UncertainAssignment("econ.power.price_kwh_peak", uniform(0.25, 0.45))
+    assert ua.name == "econ.power.price_kwh_peak"
+
+
+def test_uncertain_assignment_to_dict_echoes_spec():
+    ua = UncertainAssignment("econ.power.price_kwh_peak", uniform(0.25, 0.45))
+    d = ua.to_dict()
+    assert d["name"] == "econ.power.price_kwh_peak"
+    assert d["distribution"]["kind"] == "uniform"
+    assert d["distribution"]["low"] == 0.25
+
+
+def test_uncertain_assignment_rejects_normal_for_positive_variable():
+    """
+    SYNTHETIC: physics.speed_of_light has positive=True. Normal dist has
+    mass at negative values, so it must be rejected.
+    """
+    from gpu_stack import Registry
+    positive_vars = [
+        name for name, v in Registry.variables.items()
+        if v.symbol.is_positive
+    ]
+    assert positive_vars, "need at least one positive-assumption variable"
+    target = positive_vars[0]
+    with pytest.raises(ValueError, match="positive=True"):
+        UncertainAssignment(target, normal(mean=1.0, std=0.5))
+
+
+def test_uncertain_assignment_rejects_negative_uniform_for_positive_variable():
+    from gpu_stack import Registry
+    positive_vars = [
+        name for name, v in Registry.variables.items()
+        if v.symbol.is_positive
+    ]
+    assert positive_vars
+    target = positive_vars[0]
+    with pytest.raises(ValueError, match="positive=True"):
+        UncertainAssignment(target, uniform(-1.0, 1.0))
+
+
+def test_uncertain_assignment_accepts_lognormal_for_positive_variable():
+    from gpu_stack import Registry
+    positive_vars = [
+        name for name, v in Registry.variables.items()
+        if v.symbol.is_positive
+    ]
+    assert positive_vars
+    target = positive_vars[0]
+    # lognormal never places mass at non-positive values - should be accepted
+    ua = UncertainAssignment(target, lognormal(mu=0.0, sigma=0.1))
+    assert ua.name == target
+
+
+# ---------------------------------------------------------------------------
+# propagate_uncertainty: input validation
+# ---------------------------------------------------------------------------
+
+def test_propagate_uncertainty_requires_nonempty_uncertain():
+    with pytest.raises(ValueError, match="uncertain must contain"):
+        propagate_uncertainty(
+            SYNTHETIC_PRESET,
+            [COST_TARGET],
+            uncertain=[],
+            n_samples=10,
+            seed=0,
+        )
+
+
+def test_propagate_uncertainty_requires_positive_n_samples():
+    with pytest.raises(ValueError, match="n_samples must be >= 1"):
+        propagate_uncertainty(
+            SYNTHETIC_PRESET,
+            [COST_TARGET],
+            uncertain=[UNCERTAIN_PRICE],
+            n_samples=0,
+            seed=0,
+        )
+
+
+def test_propagate_uncertainty_rejects_duplicate_uncertain_variable():
+    """Duplicate variable names in uncertain list must raise ValueError."""
+    ua1 = UncertainAssignment("econ.power.price_kwh_peak", uniform(0.25, 0.35))
+    ua2 = UncertainAssignment("econ.power.price_kwh_peak", uniform(0.30, 0.45))
+    with pytest.raises(ValueError, match="appears more than once"):
+        propagate_uncertainty(
+            SYNTHETIC_PRESET,
+            [COST_TARGET],
+            uncertain=[ua1, ua2],
+            n_samples=5,
+            seed=0,
+        )
+
+
+def test_propagate_uncertainty_requires_uncertain_var_in_base_assignments():
+    """Uncertain variable must be present in the preset assignments."""
+    from gpu_stack.uncertainty import UncertainAssignment, uniform
+    # training.total_tokens is a valid variable but not in our preset's
+    # uncertain list - but it IS in the preset assignments, so we need one
+    # that isn't. Use a valid registered name that isn't assigned.
+    ua_missing = UncertainAssignment(
+        "econ.power.price_kwh_peak",
+        uniform(0.25, 0.45),
+    )
+    # Pass a plain dict without that key
+    empty_assignments = {}
+    with pytest.raises(ValueError, match="not present"):
+        propagate_uncertainty(
+            empty_assignments,
+            [COST_TARGET],
+            uncertain=[ua_missing],
+            n_samples=5,
+            seed=0,
+        )
+
+
+# ---------------------------------------------------------------------------
+# Determinism by seed
+# ---------------------------------------------------------------------------
+
+def test_propagate_uncertainty_is_deterministic_with_same_seed():
+    """Same seed must produce identical results."""
+    kwargs = dict(
+        preset_or_assignments=SYNTHETIC_PRESET,
+        targets=[COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=20,
+        seed=42,
+    )
+    r1 = propagate_uncertainty(**kwargs)
+    r2 = propagate_uncertainty(**kwargs)
+
+    t1 = r1.targets[0]
+    t2 = r2.targets[0]
+    assert t1.mean == t2.mean
+    assert t1.std == t2.std
+    assert t1.p5 == t2.p5
+    assert t1.p95 == t2.p95
+    assert t1.failure_count == t2.failure_count
+
+
+def test_propagate_uncertainty_different_seeds_produce_different_results():
+    """Different seeds should (overwhelmingly likely) produce different means."""
+    r1 = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=30,
+        seed=1,
+    )
+    r2 = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=30,
+        seed=2,
+    )
+    # With 30 samples from a uniform over a reasonably wide range, means
+    # will almost certainly differ.
+    assert r1.targets[0].mean != r2.targets[0].mean
+
+
+# ---------------------------------------------------------------------------
+# Sane quantile ordering
+# ---------------------------------------------------------------------------
+
+def test_quantile_ordering_p5_le_p50_le_p95():
+    """p5 <= p50 <= p95 must hold for any well-behaved distribution."""
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=50,
+        seed=7,
+    )
+    t = result.targets[0]
+    assert t.p5 is not None
+    assert t.p50 is not None
+    assert t.p95 is not None
+    assert t.p5 <= t.p50
+    assert t.p50 <= t.p95
+
+
+def test_quantile_ordering_with_two_uncertain_inputs():
+    """Quantile ordering holds with two uncertain inputs."""
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE, UNCERTAIN_AVAIL],
+        n_samples=50,
+        seed=11,
+    )
+    t = result.targets[0]
+    assert t.p5 is not None
+    assert t.p5 <= t.p50 <= t.p95
+
+
+# ---------------------------------------------------------------------------
+# Propagation correctness on a hand-checkable linear case
+# ---------------------------------------------------------------------------
+#
+# The dense_training_cost_fixture resolves cost_per_token through a linear
+# chain. After symbolic resolution with price as the free variable, the
+# expression has the form:
+#
+#   cost_per_token = alpha * price_kwh_peak + beta
+#
+# With price_kwh_peak ~ Uniform(low, high) and all other inputs fixed:
+#   E[cost] = alpha * (low + high)/2 + beta
+#   Var[cost] = alpha^2 * (high - low)^2 / 12
+#
+# We verify these analytically against the Monte Carlo estimates.
+
+def test_propagation_matches_analytic_mean_for_linear_case():
+    """
+    SYNTHETIC: electricity price uniform(0.25, 0.45) is a synthetic range.
+    Linear propagation through cost_per_token gives an analytic mean.
+    """
+    from gpu_stack import resolve, Registry
+
+    preset = SYNTHETIC_PRESET
+    base_assignments = dict(preset.assignments)
+    base_variants = dict(preset.variants)
+
+    # Resolve symbolically omitting the price variable.
+    partial = {k: v for k, v in base_assignments.items()
+               if k != "econ.power.price_kwh_peak"}
+    sym_result = resolve(
+        "econ.cost.per_token",
+        assignments=partial,
+        variants=base_variants,
+    )
+    expr = sym_result.value
+    price_sym = Registry.variables["econ.power.price_kwh_peak"].symbol
+    alpha = float(expr.diff(price_sym))
+    beta = float(expr.subs(price_sym, 0))
+
+    low, high = 0.25, 0.45
+    analytic_mean = alpha * (low + high) / 2.0 + beta
+
+    # 200 samples is sufficient for a linear case (lambdify path = vectorized).
+    result = propagate_uncertainty(
+        preset,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=200,
+        seed=99,
+    )
+    t = result.targets[0]
+    assert t.mean is not None
+    assert t.failure_count == 0
+    # Tolerance is 0.5% relative; linear case converges rapidly.
+    assert abs(t.mean - analytic_mean) / analytic_mean < 0.005, (
+        f"MC mean {t.mean:.4e} vs analytic {analytic_mean:.4e}"
+    )
+
+
+def test_propagation_matches_analytic_std_for_linear_case():
+    """
+    SYNTHETIC: same as above but checking standard deviation.
+    """
+    from gpu_stack import resolve, Registry
+
+    preset = SYNTHETIC_PRESET
+    base_assignments = dict(preset.assignments)
+    base_variants = dict(preset.variants)
+
+    partial = {k: v for k, v in base_assignments.items()
+               if k != "econ.power.price_kwh_peak"}
+    sym_result = resolve(
+        "econ.cost.per_token",
+        assignments=partial,
+        variants=base_variants,
+    )
+    expr = sym_result.value
+    price_sym = Registry.variables["econ.power.price_kwh_peak"].symbol
+    alpha = float(expr.diff(price_sym))
+
+    low, high = 0.25, 0.45
+    # Analytic std for uniform: (high - low) / sqrt(12).
+    # The code reports sample std (Bessel-corrected, divide by n-1).
+    # For large n, population and sample std converge; we tolerate 10%.
+    analytic_std = abs(alpha) * (high - low) / (12 ** 0.5)
+
+    # 500 samples with lambdify is fast and gives good std estimate.
+    result = propagate_uncertainty(
+        preset,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=500,
+        seed=77,
+    )
+    t = result.targets[0]
+    assert t.std is not None
+    # 10% tolerance on std is generous for sample std with 500 samples.
+    assert abs(t.std - analytic_std) / analytic_std < 0.10, (
+        f"MC std {t.std:.4e} vs analytic {analytic_std:.4e}"
+    )
+
+
+# ---------------------------------------------------------------------------
+# Failure-count behavior
+# ---------------------------------------------------------------------------
+
+def test_failure_count_is_zero_for_well_behaved_inputs():
+    """A valid range with no division by zero or infeasibility = 0 failures."""
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=100,
+        seed=3,
+    )
+    assert result.targets[0].failure_count == 0
+
+
+def test_failure_count_nonzero_when_samples_cause_zero_division():
+    """
+    SYNTHETIC: cluster_availability near zero causes division by zero in
+    the cost_per_token formula (wallclock = t_step / availability). A
+    uniform distribution that includes zero will produce failures.
+    """
+    # SYNTHETIC: availability range includes zero to force failures
+    dangerous_avail = UncertainAssignment(
+        "training.cluster_availability",
+        uniform(0.0, 0.0),  # constant zero - all samples fail
+    )
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[dangerous_avail],
+        n_samples=20,
+        seed=5,
+    )
+    t = result.targets[0]
+    # With availability=0, cost_per_token=inf (nonfinite) for every sample
+    assert t.failure_count == 20
+    assert t.mean is None
+    assert t.std is None
+    assert t.p5 is None
+
+
+def test_failure_count_partial_failure():
+    """
+    SYNTHETIC: availability uniform(0.0, 1.0) will include near-zero
+    samples that become nonfinite; expect some failures but not all.
+    Note: This test seeds and checks count is >=0 (structural, not exact).
+    """
+    from gpu_stack.uncertainty import UncertainAssignment, uniform
+    wide_avail = UncertainAssignment(
+        "training.cluster_availability",
+        uniform(0.0, 1.0),
+    )
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[wide_avail],
+        n_samples=50,
+        seed=6,
+    )
+    t = result.targets[0]
+    # failure_count >= 0 (structural invariant)
+    assert t.failure_count >= 0
+    assert t.failure_count <= t.sample_count
+
+
+# ---------------------------------------------------------------------------
+# Result structure and to_dict
+# ---------------------------------------------------------------------------
+
+def test_uncertainty_result_echoes_preset_name_and_seed():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=10,
+        seed=42,
+    )
+    assert result.preset_name == SYNTHETIC_PRESET.name
+    assert result.n_samples == 10
+    assert result.seed == 42
+
+
+def test_uncertainty_result_seed_none_when_not_supplied():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=10,
+    )
+    assert result.seed is None
+
+
+def test_uncertainty_result_targets_in_order():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET, POWER_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=20,
+        seed=1,
+    )
+    assert len(result.targets) == 2
+    assert result.targets[0].label == "cost_per_token"
+    assert result.targets[1].label == "job_dc_power"
+
+
+def test_uncertainty_result_to_dict_shape():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=10,
+        seed=42,
+    )
+    d = result.to_dict()
+    assert d["preset_name"] == SYNTHETIC_PRESET.name
+    assert d["n_samples"] == 10
+    assert d["seed"] == 42
+    assert "input_specs" in d
+    assert "targets" in d
+    assert "cost_per_token" in d["targets"]
+    t = d["targets"]["cost_per_token"]
+    for key in ("label", "target", "sample_count", "failure_count",
+                "mean", "std", "p5", "p50", "p95", "input_specs"):
+        assert key in t, f"missing key {key!r} in TargetUncertaintyStats dict"
+
+
+def test_target_stats_to_dict_contains_input_specs():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=10,
+        seed=0,
+    )
+    t_dict = result.targets[0].to_dict()
+    assert isinstance(t_dict["input_specs"], list)
+    assert len(t_dict["input_specs"]) == 1
+    assert t_dict["input_specs"][0]["name"] == "econ.power.price_kwh_peak"
+
+
+def test_uncertainty_result_input_specs_echoed():
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE, UNCERTAIN_AVAIL],
+        n_samples=10,
+        seed=0,
+    )
+    names = [spec.name for spec in result.input_specs]
+    assert "econ.power.price_kwh_peak" in names
+    assert "training.cluster_availability" in names
+
+
+# ---------------------------------------------------------------------------
+# Plain dict assignment input
+# ---------------------------------------------------------------------------
+
+def test_propagate_uncertainty_accepts_plain_dict():
+    """Caller can pass a plain dict instead of a Preset."""
+    base = dict(SYNTHETIC_PRESET.assignments)
+    base_variants = dict(SYNTHETIC_PRESET.variants)
+
+    # We need to pass variants separately - but propagate_uncertainty with a
+    # plain dict will use empty variants. So use a target that doesn't need
+    # variant resolution: job_dc_power.
+    result = propagate_uncertainty(
+        base,
+        [POWER_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=10,
+        seed=0,
+    )
+    assert result.preset_name == "<assignments>"
+    assert result.targets[0].sample_count == 10
+
+
+# ---------------------------------------------------------------------------
+# Normal and lognormal distribution coverage
+# ---------------------------------------------------------------------------
+
+def test_propagate_uncertainty_with_normal_distribution():
+    """Normal distribution over price should give nonzero std and sane mean."""
+    ua = UncertainAssignment("econ.power.price_kwh_peak", SYNTH_PRICE_NORMAL)
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[ua],
+        n_samples=50,
+        seed=13,
+    )
+    t = result.targets[0]
+    assert t.mean is not None
+    assert t.std is not None and t.std > 0
+    assert t.p5 <= t.p50 <= t.p95
+
+
+def test_propagate_uncertainty_with_lognormal_distribution():
+    """Lognormal distribution over price should give nonzero std and sane mean."""
+    ua = UncertainAssignment("econ.power.price_kwh_peak", SYNTH_PRICE_LOGNORMAL)
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[ua],
+        n_samples=50,
+        seed=17,
+    )
+    t = result.targets[0]
+    assert t.mean is not None
+    assert t.std is not None and t.std > 0
+    assert t.p5 <= t.p50 <= t.p95
+
+
+# ---------------------------------------------------------------------------
+# Multi-target run
+# ---------------------------------------------------------------------------
+
+def test_propagate_uncertainty_multi_target_both_resolved():
+    """Both cost_per_token and job_dc_power should resolve with no failures."""
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET, POWER_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=50,
+        seed=8,
+    )
+    assert len(result.targets) == 2
+    for t in result.targets:
+        assert t.failure_count == 0
+        assert t.mean is not None
+
+
+# ---------------------------------------------------------------------------
+# Performance sanity: n_samples=200 should be fast via lambdify path
+# ---------------------------------------------------------------------------
+
+def test_performance_200_samples_reasonable_time():
+    """
+    200 samples on the dense fixture should complete in a few seconds via
+    the lambdify fast path. This test fails if it takes more than 30 seconds
+    (a sign the fallback per-sample path is being used unexpectedly).
+    """
+    import time
+    start = time.monotonic()
+    result = propagate_uncertainty(
+        SYNTHETIC_PRESET,
+        [COST_TARGET],
+        uncertain=[UNCERTAIN_PRICE],
+        n_samples=200,
+        seed=0,
+    )
+    elapsed = time.monotonic() - start
+    assert elapsed < 30.0, f"200 samples took {elapsed:.1f}s (expected < 30s via lambdify)"
+    assert result.targets[0].mean is not None