central/tests/test_consumer_doc.py
2026-06-06 14:44:00 -06:00

145 lines
5.7 KiB
Python

"""Consistency tests for docs/CONSUMER-INTEGRATION.md.
The doc is the consumer contract. These tests catch drift between the doc and
the live code:
- Every StreamEntry in src/central/streams.py must appear in the doc's
"Stream layout" table — and vice versa.
- Every adapter discovered via central.adapter_discovery.discover_adapters()
must have a per-adapter subsection (### <name>) in the doc — and vice versa.
The doc's subject patterns and per-adapter copy are NOT directly asserted (they
are operator-readable prose, not machine-parsable); the registry-level checks
guard against the most common drift (adding a stream / adapter and forgetting
to document it).
"""
import re
from pathlib import Path
from central.adapter_discovery import discover_adapters
from central.streams import STREAMS
DOC_PATH = Path(__file__).resolve().parents[1] / "docs" / "CONSUMER-INTEGRATION.md"
def _doc_text() -> str:
assert DOC_PATH.is_file(), f"missing: {DOC_PATH}"
return DOC_PATH.read_text()
def _stream_layout_rows(doc: str) -> list[tuple[str, str]]:
"""Parse the doc's "Stream layout" table -> list of (stream_name, subject_filter)."""
section_re = re.compile(
r"^## 3\. Stream layout\s*\n(.*?)(?=^## )",
re.DOTALL | re.MULTILINE,
)
m = section_re.search(doc)
assert m, "doc missing '## 3. Stream layout' section"
section = m.group(1)
rows: list[tuple[str, str]] = []
# Each row: | `CENTRAL_XX` | `central.xx.>` | ... |
row_re = re.compile(r"^\|\s*`([A-Z_]+)`\s*\|\s*`(central\.[a-z_]+\.>)`\s*\|", re.MULTILINE)
for name, subj in row_re.findall(section):
rows.append((name, subj))
return rows
def _per_adapter_subsections(doc: str) -> list[str]:
"""Pull adapter names from the per-adapter section headings: '### <adapter> — ...'.
Only counts subsections inside '## 6. Per-adapter reference'.
"""
section_re = re.compile(
r"^## 6\. Per-adapter reference\s*\n(.*?)(?=^## )",
re.DOTALL | re.MULTILINE,
)
m = section_re.search(doc)
assert m, "doc missing '## 6. Per-adapter reference' section"
section = m.group(1)
heading_re = re.compile(r"^### ([a-z0-9_]+) — ", re.MULTILINE)
return heading_re.findall(section)
def test_doc_exists():
assert DOC_PATH.is_file(), f"doc missing: {DOC_PATH}"
def test_stream_table_matches_registry():
"""Every StreamEntry in streams.py must appear in the doc's stream layout table."""
doc_rows = _stream_layout_rows(_doc_text())
doc_names = {n for n, _ in doc_rows}
doc_filters = {f for _, f in doc_rows}
code_names = {s.name for s in STREAMS}
code_filters = {s.subject_filter for s in STREAMS}
assert doc_names == code_names, (
f"stream-name drift: doc-only={doc_names - code_names}, "
f"code-only={code_names - doc_names}"
)
assert doc_filters == code_filters, (
f"subject-filter drift: doc-only={doc_filters - code_filters}, "
f"code-only={code_filters - doc_filters}"
)
def test_stream_table_name_subject_pairs_consistent():
"""Each (stream_name, subject_filter) pair in the doc must match the registry exactly.
Catches the case where someone swaps the subject filter on one stream
without updating its row.
"""
doc_rows = set(_stream_layout_rows(_doc_text()))
code_rows = {(s.name, s.subject_filter) for s in STREAMS}
assert doc_rows == code_rows, (
f"row drift: doc-only={doc_rows - code_rows}, code-only={code_rows - doc_rows}"
)
def test_every_adapter_has_a_subsection():
"""Every adapter discovered in central.adapters must have a per-adapter doc subsection."""
doc_adapters = set(_per_adapter_subsections(_doc_text()))
code_adapters = set(discover_adapters().keys())
assert doc_adapters == code_adapters, (
f"adapter coverage drift: doc-only={doc_adapters - code_adapters}, "
f"code-only={code_adapters - doc_adapters}"
)
def test_subsections_appear_in_doc_order_matches_registry_size():
"""Sanity: the count of '### <adapter>' headings inside §6 equals the registry size.
Independent count check; catches the case where one heading is duplicated.
"""
doc_adapters = _per_adapter_subsections(_doc_text())
assert len(doc_adapters) == len(set(doc_adapters)), (
f"duplicate per-adapter sections: {[a for a in doc_adapters if doc_adapters.count(a) > 1]}"
)
assert len(doc_adapters) == len(discover_adapters())
def test_castle_rock_legacy_adapters_remain_removed():
"""v0.10.3 regression guard: ``state_511_atis`` and ``state_511_atis_cameras``
were ripped out because the Castle Rock legacy ``/map/mapIcons/`` +
``/List/GetData/`` shape is end-of-life on the only Idaho source we cared
about (Idaho 511) -- the official ITD adapters (``itd_511`` + ``itd_511_cameras``,
v0.10.0) supersede them. The sister-site discovery confirmed no other
Castle Rock customer still exposes the legacy shape that this adapter pair
consumed. Re-adding either module would resurrect a dying-upstream dependency."""
registry = discover_adapters()
assert "state_511_atis" not in registry, (
"state_511_atis was removed in v0.10.3; use itd_511 (v0.10.0) instead"
)
assert "state_511_atis_cameras" not in registry, (
"state_511_atis_cameras was removed in v0.10.3; use itd_511_cameras (v0.10.0) instead"
)
adapters_dir = Path(__file__).resolve().parents[1] / "src" / "central" / "adapters"
assert not (adapters_dir / "state_511_atis.py").exists(), (
"state_511_atis.py was removed in v0.10.3; do not re-add"
)
assert not (adapters_dir / "state_511_atis_cameras.py").exists(), (
"state_511_atis_cameras.py was removed in v0.10.3; do not re-add"
)