BMAD-METHOD/src/bmm-skills/3-solutioning/bmad-architecture/scripts/tests/test_lint_spine.py

271 lines
9.7 KiB
Python

# /// script
# requires-python = ">=3.10"
# dependencies = ["pytest>=8.0"]
# ///
"""Tests for lint_spine.py. Run: uv run --with pytest pytest scripts/tests/test_lint_spine.py
The spine under test: a clean spine lints empty; the linter catches exactly the
mechanical defects a prompt is unreliable at — literal placeholders, AD-n id breakage,
AD-n blocks missing required fields, and unpinned Stack versions.
"""
import importlib.util
import json
import re
import sys
from pathlib import Path
import pytest
# Load the linter under test straight from its source file: lint_spine.py sits in the
# parent of this file's directory, so it is located by path rather than by a package import.
_SPEC = importlib.util.spec_from_file_location(
"lint_spine", Path(__file__).resolve().parent.parent / "lint_spine.py"
)
lint_spine = importlib.util.module_from_spec(_SPEC)
# Register the module under its own name *before* running its body.
# NOTE(review): presumably follows the importlib "import a source file directly" recipe
# so lookups through sys.modules made while the module body runs resolve — confirm.
sys.modules["lint_spine"] = lint_spine
_SPEC.loader.exec_module(lint_spine)
# Baseline fixture: frontmatter, two AD-n blocks (each with Binds/Prevents/Rule), a fenced
# mermaid block containing a `{decision}` node, and a Stack table with two versioned rows.
# Most tests below derive a defective variant with str.replace()/split() on exact
# substrings of this text, so any edit here must keep those substrings intact.
CLEAN = """---
name: 'Demo'
---
## Invariants & Rules
### AD-1 — single write path
- **Binds:** all
- **Prevents:** divergent mutation
- **Rule:** state changes only through the command bus
### AD-2 — layered deps `[ADOPTED]`
- **Binds:** all
- **Prevents:** import cycles
- **Rule:** ui -> app -> domain, never backward
```mermaid
flowchart LR
A --> B{decision}
```
## Stack
| Name | Version |
| --- | --- |
| fastapi | 0.115 |
| pydantic | 2.9 |
"""
def cats(result):
    # collect the "category" of every finding, returned as an ascending-sorted list
    categories = [finding["category"] for finding in result["findings"]]
    categories.sort()
    return categories
def test_clean_spine_passes():
    # the untouched fixture must come back ok with a zero finding count
    report = lint_spine.lint(CLEAN)
    assert report["ok"] is True
    assert report["total_findings"] == 0
def test_mermaid_braces_not_flagged():
    # CLEAN's `{decision}` node sits inside a fenced mermaid block, so it must not be
    # reported as an unfilled template token
    categories = cats(lint_spine.lint(CLEAN))
    assert "placeholder" not in categories
def test_placeholder_markers_caught():
    # swap part of AD-1's Rule text for a literal TBD marker
    spine = CLEAN.replace("the command bus", "TBD")
    categories = cats(lint_spine.lint(spine))
    assert "placeholder" in categories
def test_similar_to_caught():
    # AD-2's Prevents field now just points at another AD instead of stating its own content
    spine = CLEAN.replace("import cycles", "similar to AD-1")
    report = lint_spine.lint(spine)
    assert any("cross-reference" in finding["detail"] for finding in report["findings"])
def test_unfilled_template_token_caught():
    # a `{decision}` token outside any fence (here: in the AD-1 heading) is a placeholder
    spine = CLEAN.replace("single write path", "{decision}")
    report = lint_spine.lint(spine)
    assert any(finding["category"] == "placeholder" for finding in report["findings"])
def test_duplicate_ad_id_caught():
    # renumber the second heading so the file carries two AD-1 blocks
    spine = CLEAN.replace(
        "### AD-2 — layered deps `[ADOPTED]`",
        "### AD-1 — layered deps",
    )
    categories = cats(lint_spine.lint(spine))
    assert "ad_id" in categories
def test_non_monotonic_ad_id_caught():
    # renumber both headings so the file reads AD-9 first, then AD-5 (ids running backwards)
    spine = CLEAN.replace(
        "### AD-2 — layered deps `[ADOPTED]`", "### AD-5 — layered deps"
    )
    spine = spine.replace(
        "### AD-1 — single write path", "### AD-9 — single write path"
    )
    report = lint_spine.lint(spine)
    assert any("non-monotonic" in finding["detail"] for finding in report["findings"])
def test_missing_field_caught():
    # drop AD-1's whole Rule bullet; the finding must be an ad_fields one that names "rule"
    rule_line = "- **Rule:** state changes only through the command bus\n"
    report = lint_spine.lint(CLEAN.replace(rule_line, ""))
    assert any(
        finding["category"] == "ad_fields" and "rule" in finding["detail"]
        for finding in report["findings"]
    )
def test_unpinned_dep_caught():
    # blank out the fastapi row's Version cell
    spine = CLEAN.replace("| fastapi | 0.115 |", "| fastapi | |")
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" in categories
def test_placeholder_version_caught():
    # a `{pin}` token in the Version cell must yield a version_pin finding naming fastapi
    spine = CLEAN.replace("| fastapi | 0.115 |", "| fastapi | {pin} |")
    report = lint_spine.lint(spine)
    assert any(
        finding["category"] == "version_pin" and "fastapi" in finding["detail"]
        for finding in report["findings"]
    )
def test_no_stack_section_ok():
    # keep only the text before the Stack heading: with no Stack section there is
    # nothing to pin, so no version_pin finding may appear
    before_stack, _, _ = CLEAN.partition("## Stack")
    categories = cats(lint_spine.lint(before_stack))
    assert "version_pin" not in categories
def test_stack_skeleton_row_not_version_pinned():
    # a row whose name is itself still a {token} belongs to the placeholder pass;
    # reporting it again as version_pin would be a double report
    skeleton_row = "| {language / framework} | {pinned version} |"
    spine = CLEAN.replace("| fastapi | 0.115 |", skeleton_row)
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" not in categories
def test_stack_html_comment_not_parsed_as_row():
    # an HTML comment placed directly under the Stack heading must not produce a
    # version_pin finding
    with_comment = "## Stack\n\n<!-- SEED — verified current 2026-06 -->\n"
    spine = CLEAN.replace("## Stack\n", with_comment)
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" not in categories
def test_template_token_is_low_severity():
    # braces in prose can be legitimate, so a bare {token} is reported at low severity
    # rather than high; that keeps the mechanical pass close to zero false positives
    spine = CLEAN.replace("single write path", "{decision}")
    report = lint_spine.lint(spine)
    token_findings = [
        finding
        for finding in report["findings"]
        if finding["category"] == "placeholder" and "template token" in finding["detail"]
    ]
    assert token_findings
    assert all(finding["severity"] == "low" for finding in token_findings)
def test_no_frontmatter_body_still_scanned():
    # a spine with no frontmatter block at all: the TBD in the body must still be caught
    spine = "## Invariants\n\n### AD-1 — x\n\n- **Binds:** all\n- **Prevents:** drift\n- **Rule:** TBD\n"
    categories = cats(lint_spine.lint(spine))
    assert "placeholder" in categories
def test_frontmatter_value_with_dashes_not_truncated():
    # the closing fence is matched as a whole line, so '---' inside a value must not
    # end the frontmatter early
    frontmatter = "---\nname: 'x'\nscope: 'phase 1 --- phase 2'\n---\n\n"
    stack = "## Stack\n\n| Name | Version |\n| --- | --- |\n| fastapi | |\n"
    report = lint_spine.lint(frontmatter + stack)
    # the unpinned row sits after the inline '---', so finding it proves the body was read
    assert any(finding["category"] == "version_pin" for finding in report["findings"])
def test_ad_heading_in_fence_not_counted():
    # one real, complete AD-1 plus an AD-2 heading that appears only inside a code fence
    frontmatter = "---\nname: 'x'\n---\n\n"
    live_ad = "### AD-1 — real\n\n- **Binds:** all\n- **Prevents:** drift\n- **Rule:** do x\n\n"
    fenced_docs = "## Docs\n\n```text\n### AD-2 — illustrative only, no fields\n```\n"
    report = lint_spine.lint(frontmatter + live_ad + fenced_docs)
    # the fenced AD-2 is not a live AD, so it raises neither ad_fields nor ad_id
    assert report["ok"] is True
def test_stack_table_flags_only_the_unpinned_row():
    # one pinned row and one blank-version row: exactly the blank one is reported
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| fastapi | 0.115 |\n| redis | |\n"
    report = lint_spine.lint(table_head + table_rows)
    unpinned = [
        finding for finding in report["findings"] if finding["category"] == "version_pin"
    ]
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]
def test_stack_table_all_pinned_ok():
    # a Stack table whose only row carries a version yields no version_pin finding
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| fastapi | 0.115 |\n"
    categories = cats(lint_spine.lint(table_head + table_rows))
    assert "version_pin" not in categories
def test_fenced_stack_rows_not_parsed():
    # fences are blanked before this pass, as for every other pass, so an illustrative
    # table row inside a fence under ## Stack is not a live row and its blank version
    # is not a finding
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    rows_then_fence = "| fastapi | 0.115 |\n\n```text\n| example | |\n```\n"
    categories = cats(lint_spine.lint(table_head + rows_then_fence))
    assert "version_pin" not in categories
def test_fenced_stack_heading_not_live():
    # a `## Stack` heading quoted inside a code fence does not open the live Stack section
    spine = "---\nname: 'x'\n---\n\n## Docs\n\n```md\n## Stack\n\n| foo | |\n```\n"
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" not in categories
def test_renamed_stack_heading_still_scanned():
    # the heading is matched on a word boundary, so `## Stack & Versions` still opens
    # the Stack section and its unpinned row is reported
    table_head = "---\nname: 'x'\n---\n\n## Stack & Versions\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| redis | |\n"
    report = lint_spine.lint(table_head + table_rows)
    unpinned = [
        finding for finding in report["findings"] if finding["category"] == "version_pin"
    ]
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]
def test_reordered_columns_pair_name_to_version():
    # header is Version-then-Name: the row with the empty version must still be
    # reported under its real name (redis)
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Version | Name |\n| --- | --- |\n"
    table_rows = "| 0.115 | fastapi |\n| | redis |\n"
    report = lint_spine.lint(table_head + table_rows)
    unpinned = [
        finding for finding in report["findings"] if finding["category"] == "version_pin"
    ]
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]
def test_placeholder_line_number_is_absolute():
    # the TBD sits on file line 13, after a five-line fence; because fences are blanked
    # rather than collapsed, the reported line must be the real one
    frontmatter = "---\nname: 'x'\n---\n\n"
    heading = "## A\n\n"
    fence = "```text\nf1\nf2\nf3\n```\n\n"
    marker = "TBD here\n"
    report = lint_spine.lint(frontmatter + heading + fence + marker)
    tbd_finding = next(
        finding for finding in report["findings"] if "TBD" in finding["detail"]
    )
    line_match = re.search(r"line (\d+)", tbd_finding["location"])
    reported_line = int(line_match.group(1))
    assert reported_line == 13
def test_missing_spine_file_reports_error(tmp_path, capsys):
    # an empty workspace has no spine file: main() still exits 0 and prints error JSON
    argv = ["--workspace", str(tmp_path)]
    exit_code = lint_spine.main(argv)
    payload = json.loads(capsys.readouterr().out)
    assert exit_code == 0
    assert payload["ok"] is False
    assert "not found" in payload["error"]
def test_frontmatter_unfilled_token_caught():
    # frontmatter is part of the contract, so an unfilled {scope}/{paradigm}/{date}
    # style token left in it has to be linted too
    spine = "---\nname: 'x'\nscope: '{what this spine governs}'\n---\n\n## Invariants\n"
    report = lint_spine.lint(spine)
    frontmatter_hits = [
        finding
        for finding in report["findings"]
        if finding["category"] == "placeholder" and "frontmatter" in finding["detail"]
    ]
    assert frontmatter_hits
    assert any("template token" in finding["detail"] for finding in frontmatter_hits)
def test_frontmatter_tbd_caught():
    # a TBD value in frontmatter yields a placeholder finding whose detail mentions
    # both "frontmatter" and "TBD"
    spine = "---\nname: 'x'\nstatus: TBD\n---\n\n## Invariants\n"
    report = lint_spine.lint(spine)
    assert any(
        finding["category"] == "placeholder"
        and "frontmatter" in finding["detail"]
        and "TBD" in finding["detail"]
        for finding in report["findings"]
    )
def test_unreadable_spine_returns_error_not_crash(tmp_path, capsys):
    # the spine exists but is not valid UTF-8: expect error JSON and exit code 0,
    # never a traceback
    spine_path = tmp_path / lint_spine.SPINE
    spine_path.write_bytes(b"\xff\xfe bad bytes not utf-8")
    argv = ["--workspace", str(tmp_path)]
    exit_code = lint_spine.main(argv)
    payload = json.loads(capsys.readouterr().out)
    assert exit_code == 0
    assert payload["ok"] is False
    assert "could not read" in payload["error"]
if __name__ == "__main__":
    # run this file's tests quietly when executed as a script; pytest's return code
    # becomes the process exit status
    raise SystemExit(pytest.main([__file__, "-q"]))