[AZ-384] C5 marginals + current_estimate/smoothed_history/health_snapshot

Replaces the last three NotImplementedError placeholders on GtsamIsam2StateEstimator with real Marginals + output methods: - current_estimate(): recovers the 6x6 Marginals covariance for the most-recently committed pose key, enforces the SPD invariant via np.linalg.cholesky (Invariant 10), converts the local-ENU pose translation to WGS84 via the shared WgsConverter, derives a body->world quaternion, and emits a fresh EstimatorOutput (smoothed=False, Invariant 4). On SPD failure transitions isam2_state -> LOST and raises EstimatorFatalError (AC-5.2 path). - smoothed_history(n): iterates the smoother's active POSE keys via _smoother.calculateEstimate().keys() (filtered by GTSAM symbol char) and the smoother timestamps via ts_map.at(key) - workaround for the pinned gtsam_unstable build's non-iterable FixedLagSmootherKeyTimestampMap. Bounded by K (Invariant 6); every entry has smoothed=True (Invariant 7). - health_snapshot(): cheap O(1) accumulator read; reports IsamState lifecycle, pose-key count, AC-NEW-8 cov_norm_growing_for_s rolling 60s deque-backed counter, and spoof_promotion_blocked via the AZ-385 state machine injection point. Adds two public injection points for AZ-385/composition root: set_enu_origin(LatLonAlt) and attach_source_label_state_machine(machine). Defaults: (0, 0, 0) ENU origin, VISUAL_PROPAGATED source label, spoof_promotion_blocked=False. Wires _record_committed_pose_key into the three add_* success paths so current_estimate only reads keys that have real values in iSAM2. The JACOBIAN path in add_pose_anchor deliberately skips this call - Invariant 3 keeps the JACOBIAN pose out of the iSAM2 graph. Tests: +27 in tests/unit/c5_state/test_az384_marginals_outputs.py covering all 10 ACs. Three obsolete AZ-382 tests (test_ac10_*_raises_named_az384) removed. Full suite: 589 passed, 2 skipped. Co-authored-by: Cursor <cursoragent@cursor.com>
2026-06-22 18:51:15 +00:00 · 2026-05-11 06:20:01 +03:00
parent fd848266d1
commit b3ad94c155
6 changed files with 991 additions and 37 deletions
@@ -31,13 +31,23 @@ there.
 from __future__ import annotations

 import time
+from collections import deque
 from typing import TYPE_CHECKING, Any, Final
-from uuid import UUID
+from uuid import UUID, uuid4

 import gtsam
 import gtsam_unstable
 import numpy as np
+from numpy.linalg import LinAlgError

+from gps_denied_onboard._types.geo import LatLonAlt
+from gps_denied_onboard._types.state import (
+    EstimatorHealth,
+    EstimatorOutput,
+    IsamState,
+    PoseSourceLabel,
+    Quat,
+)
 from gps_denied_onboard.components.c5_state._isam2_handle import (
    ISam2GraphHandle,
    ISam2GraphHandleImpl,
@@ -45,15 +55,16 @@ from gps_denied_onboard.components.c5_state._isam2_handle import (
 from gps_denied_onboard.components.c5_state.config import C5StateConfig
 from gps_denied_onboard.components.c5_state.errors import (
    EstimatorDegradedError,
+    EstimatorFatalError,
    StateEstimatorConfigError,
 )
 from gps_denied_onboard.components.c5_state.interface import StateEstimator
+from gps_denied_onboard.helpers.wgs_converter import WgsConverter
 from gps_denied_onboard.logging import get_logger

 if TYPE_CHECKING:
    from gps_denied_onboard._types.nav import ImuWindow
    from gps_denied_onboard._types.pose import PoseEstimate
-    from gps_denied_onboard._types.state import EstimatorHealth, EstimatorOutput
    from gps_denied_onboard._types.vio import VioOutput
    from gps_denied_onboard.config import Config

@@ -82,6 +93,19 @@ _STRATEGY: Final[str] = "gtsam_isam2"
 # converge without exploding.
 _DEFAULT_POSE_SIGMA: Final[float] = 0.1

+# AC-NEW-8 rolling-window length (60 s) for ``cov_norm_growing_for_s``.
+# We keep ``(monotonic_ns, cov_norm)`` tuples for every successful
+# ``current_estimate()`` and lazy-prune anything older than this on
+# read.
+_COV_NORM_WINDOW_NS: Final[int] = 60 * 1_000_000_000
+
+# Default ENU origin when none was injected — equator, prime meridian,
+# sea level. Behaviour is deliberately permissive so the estimator can
+# run on synthetic fixtures without a wired-up satellite anchor; the
+# composition root SHOULD call :meth:`set_enu_origin` before steady
+# state. AZ-385 will tie origin selection to the spoof-promotion gate.
+_DEFAULT_ENU_ORIGIN: Final[LatLonAlt] = LatLonAlt(lat_deg=0.0, lon_deg=0.0, alt_m=0.0)
+

 class GtsamIsam2StateEstimator(StateEstimator):
    """Production-default C5 estimator — iSAM2 + ``IncrementalFixedLagSmoother``.
@@ -154,6 +178,30 @@ class GtsamIsam2StateEstimator(StateEstimator):
        self._prev_imu_v_key: int | None = None
        self._prev_imu_b_key: int | None = None

+        # AZ-384 state -----------------------------------------------------
+        # Last pose key with an actually committed value in iSAM2 (used by
+        # ``current_estimate``). Set ONLY after a successful
+        # ``handle.update`` that inserts a value for that key.
+        self._last_committed_pose_key: int | None = None
+        # ENU origin for ``current_estimate``'s pose conversion. None
+        # means use ``_DEFAULT_ENU_ORIGIN``; AZ-385 wires the real
+        # origin via :meth:`set_enu_origin` from the first satellite
+        # anchor.
+        self._enu_origin: LatLonAlt | None = None
+        # Source-label state machine (AZ-385). When None,
+        # ``current_estimate`` emits ``VISUAL_PROPAGATED`` per the
+        # contract default and ``health_snapshot`` reports
+        # ``spoof_promotion_blocked=False``.
+        self._source_label_machine: Any | None = None
+        # AC-NEW-8 rolling window of ``(ts_monotonic_ns, cov_norm)``
+        # tuples for ``cov_norm_growing_for_s`` accounting.
+        self._cov_norm_window: deque[tuple[int, float]] = deque()
+        # iSAM2 lifecycle state. ``INIT`` until the first successful
+        # ``current_estimate``; ``TRACKING`` after; transitions to
+        # ``DEGRADED`` on an inflated covariance trend (AC-NEW-8) and
+        # ``LOST`` on a fatal SPD failure or GTSAM exception.
+        self._isam2_state: IsamState = IsamState.INIT
+
        self._log.debug(
            "c5.state.isam2_initialised",
            extra={
@@ -188,6 +236,28 @@ class GtsamIsam2StateEstimator(StateEstimator):
        """
        self._isam2_handle = handle

+    def set_enu_origin(self, origin: LatLonAlt) -> None:
+        """Set the WGS84 origin used by :meth:`current_estimate` for ENU→WGS84.
+
+        The composition root SHOULD call this once at startup before
+        steady-state ``current_estimate`` calls. AZ-385 (source-label
+        gate) will eventually drive this from the first satellite-
+        anchored frame. Before this is called the estimator falls
+        back to :data:`_DEFAULT_ENU_ORIGIN` (equator / prime meridian
+        / sea level) which is correct for tests but obviously wrong
+        for flight.
+        """
+        self._enu_origin = origin
+
+    def attach_source_label_state_machine(self, machine: Any) -> None:
+        """Wire the AZ-385 source-label / spoof-promotion state machine.
+
+        The injected object MUST expose ``current_label() -> PoseSourceLabel``
+        and ``is_spoof_promotion_blocked() -> bool``. AZ-384 only holds
+        the reference; AZ-385 owns the actual transition logic.
+        """
+        self._source_label_machine = machine
+
    def key_for_frame(self, frame_id: UUID | int) -> int:
        """Return the GTSAM ``Key`` for ``frame_id``, assigning on first use.

@@ -266,6 +336,7 @@ class GtsamIsam2StateEstimator(StateEstimator):
        self._reset_staging()
        self._prev_vio = vio
        self._last_added_ts_ns = ts_ns
+        self._record_committed_pose_key(curr_key)
        self._log.debug(
            "c5.state.add_vio_ok",
            extra={
@@ -321,6 +392,7 @@ class GtsamIsam2StateEstimator(StateEstimator):
                )
                raise EstimatorDegradedError(f"add_pose_anchor failed: {exc}") from exc
            self._reset_staging()
+            self._record_committed_pose_key(pose_key)
            self._log.debug(
                "c5.state.add_pose_anchor_ok",
                extra={
@@ -452,6 +524,7 @@ class GtsamIsam2StateEstimator(StateEstimator):
        self._prev_imu_v_key = curr_v_key
        self._prev_imu_b_key = curr_b_key
        self._last_added_ts_ns = imu_window.ts_end_ns
+        self._record_committed_pose_key(curr_x_key)
        self._log.debug(
            "c5.state.add_fc_imu_ok",
            extra={
@@ -466,21 +539,202 @@ class GtsamIsam2StateEstimator(StateEstimator):
        )

    # ------------------------------------------------------------------
-    # AZ-384 / AZ-385 / AZ-386 — body still owned by those tasks.
+    # AZ-384: marginals + output methods.

    def current_estimate(self) -> EstimatorOutput:
-        raise NotImplementedError(
-            "Marginals + outputs owned by AZ-384 — current_estimate body lands there."
+        """Recover the current posterior pose + 6x6 covariance.
+
+        Walks ``_isam2.calculateEstimate()`` for the most-recently
+        committed pose key, recovers the 6x6 Marginals covariance
+        from the iSAM2 graph (D-C5-5 = (c)), enforces the
+        SPD-positive-definite invariant (Invariant 10) before
+        emission, and assembles a fresh :class:`EstimatorOutput`
+        (Invariant 4 — never returns ``None`` on the steady-state
+        path).
+        """
+        handle = self._require_handle()
+        if self._last_committed_pose_key is None:
+            raise EstimatorFatalError(
+                "current_estimate: no committed pose key yet (graph empty); "
+                "AC-5.2 fallback in C8 will trigger after no_estimate_fallback_s"
+            )
+
+        try:
+            marginals = handle.compute_marginals()
+            covariance = np.asarray(
+                marginals.marginalCovariance(self._last_committed_pose_key),
+                dtype=np.float64,
+            )
+        except EstimatorFatalError:
+            self._isam2_state = IsamState.LOST
+            raise
+        except Exception as exc:
+            self._isam2_state = IsamState.LOST
+            self._log.error(
+                "c5.state.current_estimate_marginals_failed",
+                extra={
+                    "kind": "c5.state.current_estimate_marginals_failed",
+                    "kv": {
+                        "pose_key": self._last_committed_pose_key,
+                        "error": str(exc),
+                    },
+                },
+            )
+            raise EstimatorFatalError(f"compute_marginals failed: {exc}") from exc
+
+        try:
+            _enforce_spd(covariance)
+        except EstimatorFatalError:
+            self._isam2_state = IsamState.LOST
+            self._log.error(
+                "c5.state.current_estimate_spd_failed",
+                extra={
+                    "kind": "c5.state.current_estimate_spd_failed",
+                    "kv": {
+                        "pose_key": self._last_committed_pose_key,
+                        "covariance_fro_norm": float(np.linalg.norm(covariance, ord="fro")),
+                    },
+                },
+            )
+            raise
+
+        pose = self._pose_at_key(self._last_committed_pose_key)
+        position_wgs84 = self._enu_pose_to_wgs84(pose)
+        orientation = _quat_from_pose3(pose)
+        velocity_world = self._latest_velocity_or_zero()
+        last_anchor_age_ms = int(handle.last_anchor_age_ms())
+        source_label = self._derive_source_label()
+        emitted_at = time.monotonic_ns()
+
+        self._record_cov_norm_sample(emitted_at, covariance)
+        if self._isam2_state == IsamState.INIT:
+            self._isam2_state = IsamState.TRACKING
+        if self._cov_norm_growing_for_s() > 0.0:
+            # AC-NEW-8 — sustained monotone covariance growth signals
+            # poor convergence. Surface DEGRADED but keep tracking;
+            # only the SPD failure above flips us to LOST.
+            self._isam2_state = IsamState.DEGRADED
+
+        return EstimatorOutput(
+            frame_id=uuid4(),
+            position_wgs84=position_wgs84,
+            orientation_world_T_body=orientation,
+            velocity_world_mps=velocity_world,
+            covariance_6x6=covariance,
+            source_label=source_label,
+            last_satellite_anchor_age_ms=last_anchor_age_ms,
+            smoothed=False,
+            emitted_at=emitted_at,
        )

    def smoothed_history(self, n_keyframes: int) -> list[EstimatorOutput]:
-        raise NotImplementedError(
-            "Marginals + outputs owned by AZ-384 — smoothed_history body lands there."
-        )
+        """Return up to ``min(n_keyframes, K)`` past smoothed estimates.
+
+        Iterates the ``IncrementalFixedLagSmoother`` active timestamp
+        map, sorts keys by ascending timestamp, takes the most recent
+        ``min(n_keyframes, K)`` POSE keys (filters out velocity/bias
+        keys), and emits an :class:`EstimatorOutput` per key with
+        ``smoothed=True`` (Invariant 7). Out-of-window keyframes are
+        not recoverable (Invariant 6).
+        """
+        handle = self._require_handle()
+        if n_keyframes <= 0:
+            return []
+
+        try:
+            active_values = self._smoother.calculateEstimate()
+            ts_map = self._smoother.timestamps()
+        except Exception:
+            return []
+
+        pose_entries: list[tuple[int, float]] = []
+        for key in active_values.keys():
+            ikey = int(key)
+            if gtsam.symbolChr(ikey) != ord("x"):
+                continue
+            try:
+                ts_sec = float(ts_map.at(ikey))
+            except Exception:
+                continue
+            pose_entries.append((ikey, ts_sec))
+        pose_entries.sort(key=lambda kt: kt[1])
+
+        max_entries = min(n_keyframes, self._block.keyframe_window_size)
+        selected = pose_entries[-max_entries:]
+        if not selected:
+            return []
+
+        try:
+            marginals = handle.compute_marginals()
+        except Exception as exc:
+            self._log.error(
+                "c5.state.smoothed_history_marginals_failed",
+                extra={
+                    "kind": "c5.state.smoothed_history_marginals_failed",
+                    "kv": {"error": str(exc)},
+                },
+            )
+            raise EstimatorFatalError(f"smoothed_history marginals failed: {exc}") from exc
+
+        last_anchor_age_ms = int(handle.last_anchor_age_ms())
+        source_label = self._derive_source_label()
+        emitted_at = time.monotonic_ns()
+
+        out: list[EstimatorOutput] = []
+        for key, _ts in selected:
+            try:
+                cov = np.asarray(marginals.marginalCovariance(key), dtype=np.float64)
+            except Exception as exc:
+                self._log.error(
+                    "c5.state.smoothed_history_per_key_failed",
+                    extra={
+                        "kind": "c5.state.smoothed_history_per_key_failed",
+                        "kv": {"pose_key": key, "error": str(exc)},
+                    },
+                )
+                continue
+            _enforce_spd(cov)
+            try:
+                pose = active_values.atPose3(key)
+            except Exception as exc:
+                self._log.error(
+                    "c5.state.smoothed_history_pose_read_failed",
+                    extra={
+                        "kind": "c5.state.smoothed_history_pose_read_failed",
+                        "kv": {"pose_key": key, "error": str(exc)},
+                    },
+                )
+                continue
+            out.append(
+                EstimatorOutput(
+                    frame_id=uuid4(),
+                    position_wgs84=self._enu_pose_to_wgs84(pose),
+                    orientation_world_T_body=_quat_from_pose3(pose),
+                    velocity_world_mps=(0.0, 0.0, 0.0),
+                    covariance_6x6=cov,
+                    source_label=source_label,
+                    last_satellite_anchor_age_ms=last_anchor_age_ms,
+                    smoothed=True,
+                    emitted_at=emitted_at,
+                )
+            )
+        return out

    def health_snapshot(self) -> EstimatorHealth:
-        raise NotImplementedError(
-            "Marginals + outputs owned by AZ-384 — health_snapshot body lands there."
+        """Return the current iSAM2 health snapshot.
+
+        Cheap O(1) accumulator read — never touches Marginals
+        (contract NFR: ``health_snapshot`` p99 ≤ 5 µs). Reports the
+        cached :class:`IsamState`, the smoother's active keyframe
+        count, the AC-NEW-8 ``cov_norm_growing_for_s`` rolling
+        counter, and the spoof-promotion gate state via the injected
+        :attr:`_source_label_machine` (default ``False`` if none).
+        """
+        return EstimatorHealth(
+            isam2_state=self._isam2_state,
+            keyframe_count=self._smoother_keyframe_count(),
+            cov_norm_growing_for_s=self._cov_norm_growing_for_s(),
+            spoof_promotion_blocked=self._spoof_promotion_blocked(),
        )

    # ------------------------------------------------------------------
@@ -515,6 +769,146 @@ class GtsamIsam2StateEstimator(StateEstimator):
        self._graph = gtsam.NonlinearFactorGraph()
        self._values = gtsam.Values()

+    def _record_committed_pose_key(self, key: int) -> None:
+        """Cache the most-recently committed pose key for ``current_estimate``.
+
+        Called from every ``add_*`` success path AFTER
+        ``handle.update`` returns; guarantees the key has a real
+        value in ``_isam2`` before ``current_estimate`` tries to read
+        it. The JACOBIAN path of ``add_pose_anchor`` deliberately
+        does NOT call this — its pose is never committed to the
+        iSAM2 graph (Invariant 3).
+        """
+        self._last_committed_pose_key = key
+
+    def _pose_at_key(self, key: int) -> gtsam.Pose3:
+        """Read ``Pose3`` for ``key`` from the current iSAM2 estimate.
+
+        Raises :class:`EstimatorFatalError` if the key is missing or
+        the read fails (e.g. GTSAM raised). The caller is responsible
+        for guaranteeing the key was previously committed via
+        :meth:`_record_committed_pose_key`.
+        """
+        try:
+            values = self._isam2.calculateEstimate()
+            return values.atPose3(key)
+        except Exception as exc:
+            raise EstimatorFatalError(f"_pose_at_key({key}) failed: {exc}") from exc
+
+    def _enu_pose_to_wgs84(self, pose: gtsam.Pose3) -> LatLonAlt:
+        """Convert a local-ENU pose's translation to WGS84.
+
+        Uses the injected ``_enu_origin`` (or :data:`_DEFAULT_ENU_ORIGIN`
+        when none was wired). The orientation is preserved verbatim
+        as a body→world quaternion — only the translation needs the
+        WGS coordinate change.
+        """
+        origin = self._enu_origin if self._enu_origin is not None else _DEFAULT_ENU_ORIGIN
+        translation = np.asarray(pose.translation(), dtype=np.float64).reshape(3)
+        try:
+            return WgsConverter.local_enu_to_latlonalt(origin, translation)
+        except Exception as exc:
+            raise EstimatorFatalError(f"_enu_pose_to_wgs84 failed: {exc}") from exc
+
+    def _latest_velocity_or_zero(self) -> tuple[float, float, float]:
+        """Read the most-recent IMU keyframe's velocity or fall back to zero.
+
+        ``CombinedImuFactor`` writes a 3-vector velocity at the ``v``
+        key for each IMU keyframe. When no IMU keyframe has been
+        committed yet, returns ``(0, 0, 0)`` — the downstream consumer
+        infers this from a ``DEAD_RECKONED`` / ``VISUAL_PROPAGATED``
+        source label.
+        """
+        if self._prev_imu_v_key is None:
+            return (0.0, 0.0, 0.0)
+        try:
+            values = self._isam2.calculateEstimate()
+            raw = np.asarray(values.atVector(self._prev_imu_v_key), dtype=np.float64).reshape(3)
+            return (float(raw[0]), float(raw[1]), float(raw[2]))
+        except Exception:
+            return (0.0, 0.0, 0.0)
+
+    def _derive_source_label(self) -> PoseSourceLabel:
+        """Read the source label from the AZ-385 state machine if wired.
+
+        Falls back to ``VISUAL_PROPAGATED`` when no state machine is
+        attached — the contract's neutral steady-state default before
+        the spoof-promotion gate has any evidence either way.
+        """
+        if self._source_label_machine is None:
+            return PoseSourceLabel.VISUAL_PROPAGATED
+        try:
+            label = self._source_label_machine.current_label()
+        except Exception as exc:
+            self._log.error(
+                "c5.state.source_label_machine_failed",
+                extra={
+                    "kind": "c5.state.source_label_machine_failed",
+                    "kv": {"error": str(exc)},
+                },
+            )
+            return PoseSourceLabel.VISUAL_PROPAGATED
+        if not isinstance(label, PoseSourceLabel):
+            return PoseSourceLabel.VISUAL_PROPAGATED
+        return label
+
+    def _spoof_promotion_blocked(self) -> bool:
+        """Query the AZ-385 state machine for the spoof gate state."""
+        if self._source_label_machine is None:
+            return False
+        try:
+            return bool(self._source_label_machine.is_spoof_promotion_blocked())
+        except Exception:
+            return False
+
+    def _smoother_keyframe_count(self) -> int:
+        """Count the smoother's active POSE keys.
+
+        ``IncrementalFixedLagSmoother.calculateEstimate()`` returns
+        the ``Values`` for every key still inside the sliding
+        window; we filter to POSE keys (``'x'`` namespace) per
+        Invariant 6.
+        """
+        try:
+            keys = list(self._smoother.calculateEstimate().keys())
+        except Exception:
+            return 0
+        return sum(1 for k in keys if gtsam.symbolChr(int(k)) == ord("x"))
+
+    def _record_cov_norm_sample(self, ts_ns: int, covariance: np.ndarray) -> None:
+        """Append a ``(ts_ns, fro_norm(cov))`` sample to the rolling window."""
+        norm = float(np.linalg.norm(covariance, ord="fro"))
+        self._cov_norm_window.append((ts_ns, norm))
+        self._prune_cov_norm_window(ts_ns)
+
+    def _prune_cov_norm_window(self, now_ns: int) -> None:
+        cutoff = now_ns - _COV_NORM_WINDOW_NS
+        while self._cov_norm_window and self._cov_norm_window[0][0] < cutoff:
+            self._cov_norm_window.popleft()
+
+    def _cov_norm_growing_for_s(self) -> float:
+        """Return the length (s) of the latest strictly-rising suffix.
+
+        Walks the rolling window from newest to oldest; accumulates
+        time while each sample is greater than its successor. Resets
+        the moment we find a non-rising step. Maps AC-NEW-8: "Resets
+        to 0 on a non-rising frame".
+        """
+        if len(self._cov_norm_window) < 2:
+            return 0.0
+        samples = list(self._cov_norm_window)
+        # Walk newest → second-newest; stop when the chain breaks.
+        oldest_rising_idx = len(samples) - 1
+        for i in range(len(samples) - 1, 0, -1):
+            if samples[i][1] > samples[i - 1][1]:
+                oldest_rising_idx = i - 1
+            else:
+                break
+        if oldest_rising_idx == len(samples) - 1:
+            return 0.0
+        span_ns = samples[-1][0] - samples[oldest_rising_idx][0]
+        return max(0.0, span_ns * 1e-9)
+

 # ----------------------------------------------------------------------
 # Module-level helpers.
@@ -614,3 +1008,38 @@ def _make_timestamp_map(
    for key in keys:
        ts_map.insert((key, ts_seconds))
    return ts_map
+
+
+# ----------------------------------------------------------------------
+# Module-level pure helpers (AZ-384).
+
+
+def _quat_from_pose3(pose: gtsam.Pose3) -> Quat:
+    """Build a scalar-first :class:`Quat` from a ``gtsam.Pose3``.
+
+    Uses ``Rot3.toQuaternion`` to get the body→world unit
+    quaternion; we explicitly normalise to defend against numerical
+    drift inside the iSAM2 estimate.
+    """
+    rot = pose.rotation()
+    q = rot.toQuaternion()
+    w, x, y, z = float(q.w()), float(q.x()), float(q.y()), float(q.z())
+    norm = (w * w + x * x + y * y + z * z) ** 0.5
+    if norm < 1e-12:
+        return Quat(w=1.0, x=0.0, y=0.0, z=0.0)
+    return Quat(w=w / norm, x=x / norm, y=y / norm, z=z / norm)
+
+
+def _enforce_spd(covariance: np.ndarray) -> None:
+    """Cholesky-check ``covariance``; raise ``EstimatorFatalError`` on failure.
+
+    The C5 contract (Invariant 10) demands every emitted
+    ``covariance_6x6`` is symmetric positive-definite. We use
+    Cholesky-decomposition as the defensive check because it's the
+    same primitive iSAM2 uses internally — a failure here means the
+    posterior is numerically broken, NOT merely degraded.
+    """
+    try:
+        np.linalg.cholesky(covariance)
+    except LinAlgError as exc:
+        raise EstimatorFatalError(f"covariance failed SPD invariant: {exc}") from exc