mirror of
https://github.com/azaion/gps-denied-onboard.git
synced 2026-06-21 14:31:12 +00:00
59d9116d36
Bootstraps the public-boundary blackbox test harness owned by epic
AZ-262 (E-BBT). Establishes the e2e/ directory tree at the repo root,
fully separated from src/gps_denied_onboard/** and from the in-process
tests/** tree, and commits to the contracts every subsequent test
ticket (AZ-407..AZ-446) builds against.
Tier-1 (workstation Docker):
- docker/docker-compose.test.yml wires SUT + ArduPilot SITL + iNav SITL
+ mock Suite Sat Service + mavproxy listener + e2e-runner onto one
e2e-net bridge with internal: true (enforces RESTRICT-SAT-1 /
NFT-SEC-02 egress isolation at the network layer).
- docker/docker-compose.tier2-bridge.yml override disables the
in-compose SUT so Tier-2 pairs SITLs + mock + runner on an x86 host
while the SUT runs natively on the Jetson under systemd.
Tier-2 (Jetson):
- jetson/run-tier2.sh + tier2.service systemd unit + tegrastats /
jtop parsers feed per-sample telemetry into the evidence bundle.
Runner image (e2e/runner/):
- Dockerfile + requirements.txt install ONLY ground-side libs
(pymavlink, opencv-python>=4.12, numpy/scipy/geopy/pyproj, httpx,
orjson, pydantic, structlog, pytest 8.x). The runner deliberately
does NOT install the SUT package.
- conftest.py implements the AC-9 skip-rule mapping (tier2_only,
chamber_only, vins_mono, deferred_ac) tied to environment.md
parametrize axes.
- reporting/csv_reporter.py is a pytest plugin emitting one row per
test with the exact 11-column schema from environment.md §
Reporting (test_id, test_name, traces_to, fc_adapter, vio_strategy,
tier, started_at_utc, execution_time_ms, result, error_message,
evidence_paths). XFAIL surfaced only when a test carries
@pytest.mark.deferred_ac(verdict="xfail", reason=...).
- reporting/evidence_bundler.py exposes the attach_evidence fixture
that copies per-test artifacts (.tlog, FDR archives, screenshots,
tegrastats / jtop CSVs) into the run bundle and records relative
paths into the reporter's evidence_paths column.
- helpers/{frame_source_replay,imu_replay,sitl_observer,
mavproxy_tlog_reader,fdr_reader}.py declare the public surfaces
(concrete implementations owned by AZ-407 / AZ-408 / AZ-416 /
AZ-417 / AZ-441 per the dependency table); helpers/geo.py ships
today (no downstream task dep) — WGS84 distance / forward-bearing
/ offset via pyproj with NaN rejection.
Mock Suite Sat Service (e2e/fixtures/mock-suite-sat/):
- FastAPI app: POST /tiles (ingest contract from D-PROJ-2 follow-up),
GET /tiles/audit + /mock/audit (per-run read-back), POST
/mock/config (force-status, response delay), POST /mock/reset
(clears audit between tests), GET /mock/health.
Fixture scaffolds (e2e/fixtures/{tile-cache-builder, age-injector,
injectors, cold-boot, secrets, security}/):
- Public surfaces only. Concrete builders land in AZ-407 (static
fixtures), AZ-408 (runtime synthetic injection), AZ-419 (cold-boot
fixture), AZ-439 (CVE-2025-53644 JPEG generator).
Test tree (e2e/tests/{positive,negative,performance,resilience,
security,resource_limit}/):
- Mirror of the test-spec category grouping in
_docs/02_document/tests/*-tests.md.
- tests/positive/test_smoke.py is the AC-1 harness-boot smoke run
inside the e2e-runner image once Docker brings everything up.
Out-of-container unit tests (e2e/_unit_tests/):
- Exercises the harness internals (CSV reporter plugin lifecycle,
conftest skip rules, helper modules, parsers, mock app, compose
YAML structural contract, public-boundary enforcement) without
Docker / SITL. 97 unit tests, all passing.
Build / config:
- pyproject.toml: testpaths extended with e2e/_unit_tests; pythonpath
extended with e2e; fastapi>=0.111,<0.120 added to dev extras for the
mock-app TestClient unit test.
AC coverage:
- AC-1 (Tier-1 boot) → compose YAML test + directory layout
+ smoke test (Docker-bound)
- AC-2 (mock services) → 6 FastAPI TestClient unit tests
- AC-3 (SITLs accept output) → contract present; concrete check
deferred to AZ-416 / AZ-417
- AC-4 (CSV columns) → in-process plugin lifecycle test
emits the exact 11-column schema
- AC-5 (egress isolation) → static config test + runtime probe
in Docker-bound smoke
- AC-6 (Tier-2 contract) → tegrastats + jtop parser unit tests
+ jetson/* layout test; full Tier-2
contract is AZ-444
- AC-7 (fixture reproducibility) → deferred to AZ-407 per task spec
- AC-8 (parametrize matrix) → vins_mono skip-rule cases +
tests/positive/test_smoke
- AC-9 (skip semantics) → 9 conftest skip-rule unit tests
The module layout entry for blackbox_tests was added in the 2026-05-16
preparatory commit d7a17a8 so this diff stays focused on the harness
scaffold. AZ-406 advances to In Testing on commit.
Co-authored-by: Cursor <cursoragent@cursor.com>
145 lines
5.5 KiB
Python
145 lines
5.5 KiB
Python
"""Unit tests for the runner conftest's skip / xfail enforcement.

We exercise `pytest_collection_modifyitems` directly with a fake config and
a synthetic item list, then assert the post-conditions (marker added, etc.).

This catches regressions where someone changes the skip rules without
updating the traceability matrix — see
`_docs/02_document/tests/traceability-matrix.md` § Uncovered Items Analysis.
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
import sys
|
|
from pathlib import Path
|
|
from types import SimpleNamespace
|
|
|
|
import pytest
|
|
|
|
_E2E_ROOT = Path(__file__).resolve().parents[1]
|
|
if str(_E2E_ROOT) not in sys.path:
|
|
sys.path.insert(0, str(_E2E_ROOT))
|
|
|
|
from runner.conftest import pytest_collection_modifyitems # noqa: E402
|
|
|
|
|
|
class _Marker(SimpleNamespace):
    """Attribute bag standing in for a pytest marker.

    The tests in this module build it with ``args`` and ``kwargs`` attributes
    and hand it to ``_FakeItem`` as the result of ``get_closest_marker``.
    """
|
|
|
|
|
|
class _FakeKeywords(set):
    """Plain ``set`` posing as ``pytest.Item.keywords``.

    Only the ``name in keywords`` membership check over marker names is
    emulated; nothing else of the real keywords mapping is provided.
    """
|
|
|
|
|
|
class _FakeItem:
    """Synthetic collection item passed to ``pytest_collection_modifyitems``.

    It exposes ``keywords``, ``callspec``, ``get_closest_marker`` and
    ``add_marker``. Markers passed to ``add_marker`` are recorded, in call
    order, on ``added_markers`` so tests can inspect what the hook did.
    """

    def __init__(
        self,
        keywords: set[str] | None = None,
        markers: dict[str, _Marker] | None = None,
        callspec: SimpleNamespace | None = None,
    ) -> None:
        """Build a fake item.

        Args:
            keywords: Marker names reported by ``name in item.keywords``.
            markers: Mapping of marker name to the object returned by
                ``get_closest_marker``.
            callspec: Optional object exposing parametrization ``params``.
        """
        # Everything the hook attaches to this item ends up here.
        self.added_markers: list[_Marker] = []
        self.callspec = callspec
        self._markers = markers or {}
        self.keywords = _FakeKeywords(keywords or set())

    def get_closest_marker(self, name: str) -> _Marker | None:
        """Return the marker registered under *name*, or ``None`` if absent."""
        return self._markers[name] if name in self._markers else None

    def add_marker(self, marker: _Marker) -> None:
        """Record *marker* instead of applying it, preserving call order."""
        self.added_markers.append(marker)
|
|
|
|
|
|
class _FakeConfig:
    """Stand-in for the pytest config object handed to the collection hook.

    Only ``getoption`` is provided, and it only knows the three command-line
    options ``--enable-chamber``, ``--build-kind`` and
    ``--allow-no-skip-reason``.
    """

    # Sentinel for "no default supplied"; ``None`` is a legitimate default value.
    _NOTSET = object()

    def __init__(
        self,
        chamber: bool = False,
        build_kind: str = "production",
        allow_no_reason: bool = False,
    ) -> None:
        """Store the option values later served by ``getoption``.

        Args:
            chamber: Value returned for ``--enable-chamber``.
            build_kind: Value returned for ``--build-kind``.
            allow_no_reason: Value returned for ``--allow-no-skip-reason``.
        """
        self._chamber = chamber
        self._build_kind = build_kind
        self._allow_no_reason = allow_no_reason

    def getoption(self, name: str, default: object = _NOTSET) -> object:
        """Return the configured value for the option *name*.

        Accepts an optional *default*, as pytest's own ``Config.getoption``
        does, so a hook that calls ``getoption(name, default=...)`` works
        against this fake too.

        Args:
            name: Option string, e.g. ``"--build-kind"``.
            default: Value returned when *name* is not a known option.

        Returns:
            The stored option value, or *default* for an unknown option.

        Raises:
            KeyError: If *name* is unknown and no *default* was given.
        """
        options = {
            "--enable-chamber": self._chamber,
            "--build-kind": self._build_kind,
            "--allow-no-skip-reason": self._allow_no_reason,
        }
        if name in options:
            return options[name]
        if default is not self._NOTSET:
            return default
        raise KeyError(name)
|
|
|
|
|
|
def _skip_reasons(item: _FakeItem) -> list[str]:
    """Return ``str()`` of every marker recorded on *item*, in insertion order.

    The markers are stringified rather than unpacked, so callers can simply
    substring-match the expected reason text without depending on the shape
    of the marker object.
    """
    return [str(marker) for marker in item.added_markers]
|
|
|
|
|
|
def test_tier2_only_skipped_on_tier1(monkeypatch: pytest.MonkeyPatch) -> None:
    """With TIER=tier1-docker, a ``tier2_only`` item gets a "Tier-2 only" marker."""
    monkeypatch.setenv("TIER", "tier1-docker")
    tier2_item = _FakeItem(keywords={"tier2_only"})

    pytest_collection_modifyitems(_FakeConfig(), [tier2_item])

    reasons = _skip_reasons(tier2_item)
    assert any("Tier-2 only" in reason for reason in reasons)
|
|
|
|
|
|
def test_tier2_only_runs_on_tier2(monkeypatch: pytest.MonkeyPatch) -> None:
    """With TIER=tier2-jetson, a ``tier2_only`` item receives no marker."""
    monkeypatch.setenv("TIER", "tier2-jetson")
    tier2_item = _FakeItem(keywords={"tier2_only"})

    pytest_collection_modifyitems(_FakeConfig(), [tier2_item])

    assert not tier2_item.added_markers, "tier2_only test should run when TIER=tier2-jetson"
|
|
|
|
|
|
def test_chamber_only_skipped_without_flag(monkeypatch: pytest.MonkeyPatch) -> None:
    """Without ``--enable-chamber``, a ``chamber_only`` item gets a "Chamber" marker."""
    monkeypatch.setenv("TIER", "tier2-jetson")
    chamber_item = _FakeItem(keywords={"chamber_only"})
    config = _FakeConfig(chamber=False)

    pytest_collection_modifyitems(config, [chamber_item])

    reasons = _skip_reasons(chamber_item)
    assert any("Chamber" in reason for reason in reasons)
|
|
|
|
|
|
def test_chamber_only_runs_with_flag(monkeypatch: pytest.MonkeyPatch) -> None:
    """With ``--enable-chamber`` set, a ``chamber_only`` item receives no marker."""
    monkeypatch.setenv("TIER", "tier2-jetson")
    chamber_item = _FakeItem(keywords={"chamber_only"})
    config = _FakeConfig(chamber=True)

    pytest_collection_modifyitems(config, [chamber_item])

    assert not chamber_item.added_markers, "chamber_only test should run with --enable-chamber"
|
|
|
|
|
|
def test_vins_mono_skipped_on_production(monkeypatch: pytest.MonkeyPatch) -> None:
    """On a production build, a ``vio_strategy=vins_mono`` case is marked research-build-only."""
    monkeypatch.setenv("TIER", "tier1-docker")
    # The strategy is carried as a parametrization value, not as a keyword.
    vins_item = _FakeItem(callspec=SimpleNamespace(params={"vio_strategy": "vins_mono"}))
    config = _FakeConfig(build_kind="production")

    pytest_collection_modifyitems(config, [vins_item])

    reasons = _skip_reasons(vins_item)
    assert any("research-build-only" in reason for reason in reasons)
|
|
|
|
|
|
def test_vins_mono_runs_on_research(monkeypatch: pytest.MonkeyPatch) -> None:
    """On a research build, a ``vio_strategy=vins_mono`` case receives no marker."""
    monkeypatch.setenv("TIER", "tier1-docker")
    # The strategy is carried as a parametrization value, not as a keyword.
    vins_item = _FakeItem(callspec=SimpleNamespace(params={"vio_strategy": "vins_mono"}))
    config = _FakeConfig(build_kind="research")

    pytest_collection_modifyitems(config, [vins_item])

    assert not vins_item.added_markers, "vins_mono should run on research builds"
|
|
|
|
|
|
def test_deferred_ac_without_reason_blocks_collection(monkeypatch: pytest.MonkeyPatch) -> None:
    """A ``deferred_ac`` marker lacking ``reason`` yields a "without reason=" marker.

    Runs with ``--allow-no-skip-reason`` turned off.
    """
    monkeypatch.setenv("TIER", "tier1-docker")
    reasonless = _Marker(args=(), kwargs={})
    deferred_item = _FakeItem(markers={"deferred_ac": reasonless})
    config = _FakeConfig(allow_no_reason=False)

    pytest_collection_modifyitems(config, [deferred_item])

    reasons = _skip_reasons(deferred_item)
    assert any("without reason=" in reason for reason in reasons)
|
|
|
|
|
|
def test_deferred_ac_with_reason_emits_skip(monkeypatch: pytest.MonkeyPatch) -> None:
    """A ``deferred_ac`` marker with a reason produces a marker carrying that reason."""
    monkeypatch.setenv("TIER", "tier1-docker")
    deferred = _Marker(args=(), kwargs={"reason": "AC-7.1 — see traceability matrix"})
    deferred_item = _FakeItem(markers={"deferred_ac": deferred})

    pytest_collection_modifyitems(_FakeConfig(), [deferred_item])

    reasons = _skip_reasons(deferred_item)
    assert any("AC-7.1" in reason for reason in reasons)
|
|
|
|
|
|
def test_deferred_ac_xfail_verdict_emits_xfail(monkeypatch: pytest.MonkeyPatch) -> None:
    """A ``deferred_ac(verdict="xfail")`` marker must yield an xfail marker.

    Checking only that *some* marker was added would also pass if the hook
    emitted a skip, so the kind of the added marker is asserted as well.
    """
    monkeypatch.setenv("TIER", "tier1-docker")
    marker = _Marker(args=(), kwargs={"reason": "AC-8.6 scene-change PARTIAL", "verdict": "xfail"})
    item = _FakeItem(markers={"deferred_ac": marker})

    pytest_collection_modifyitems(_FakeConfig(), [item])

    assert item.added_markers, "deferred_ac(verdict=xfail) must mark the item"
    # pytest's Mark / MarkDecorator expose the marker kind as ``.name``; a
    # marker given as a plain string is compared directly.
    # NOTE(review): assumes the hook adds ``pytest.mark.xfail(...)`` (or the
    # string "xfail") — confirm against runner/conftest.py.
    assert any(getattr(m, "name", m) == "xfail" for m in item.added_markers), (
        "deferred_ac(verdict=xfail) must add an xfail marker, not a skip"
    )
|