BMAD-METHOD/src/bmm-skills/3-solutioning/bmad-architecture/scripts/tests/test_lint_spine.py

# /// script
# requires-python = ">=3.10"
# dependencies = ["pytest>=8.0"]
# ///
"""Tests for lint_spine.py. Run: uv run --with pytest pytest scripts/tests/test_lint_spine.py

The spine under test: a clean spine lints empty; the linter catches exactly the
mechanical defects a prompt is unreliable at — literal placeholders, AD-n id breakage,
AD-n blocks missing required fields, and unpinned Stack versions.
"""
import importlib.util
import json
import re
import sys
from pathlib import Path

import pytest

# Load the linter under test straight from its source file rather than through a
# package import: lint_spine.py sits one directory above this tests/ directory.
_SPEC = importlib.util.spec_from_file_location(
    "lint_spine", Path(__file__).resolve().parent.parent / "lint_spine.py"
)
lint_spine = importlib.util.module_from_spec(_SPEC)
# Register the module under its name before executing it, then run its top-level code.
sys.modules["lint_spine"] = lint_spine
_SPEC.loader.exec_module(lint_spine)


# Baseline fixture: a spine document that test_clean_spine_passes expects to lint with
# zero findings. It contains frontmatter, two AD blocks (each with Binds / Prevents /
# Rule bullets), a fenced mermaid diagram whose `{decision}` node sits inside the fence,
# and a Stack table with two pinned versions. Most tests derive a single-defect variant
# from it via str.replace, so the exact text below is load-bearing.
CLEAN = """---
name: 'Demo'
---

## Invariants & Rules

### AD-1 — single write path

- **Binds:** all
- **Prevents:** divergent mutation
- **Rule:** state changes only through the command bus

### AD-2 — layered deps `[ADOPTED]`

- **Binds:** all
- **Prevents:** import cycles
- **Rule:** ui -> app -> domain, never backward

```mermaid
flowchart LR
  A --> B{decision}
```

## Stack

| Name | Version |
| --- | --- |
| fastapi | 0.115 |
| pydantic | 2.9 |
"""


def cats(result):
    """Return the sorted list of finding categories in a lint result.

    ``result`` is a mapping with a ``"findings"`` iterable whose items each carry a
    ``"category"`` key. Duplicates are kept, so a category appears once per finding.
    """
    labels = [entry["category"] for entry in result["findings"]]
    labels.sort()
    return labels


def test_clean_spine_passes():
    """The unmodified CLEAN fixture lints as ok with a finding count of zero."""
    report = lint_spine.lint(CLEAN)
    assert report["ok"] is True
    assert report["total_findings"] == 0


def test_mermaid_braces_not_flagged():
    """Braces inside CLEAN's fenced mermaid block produce no placeholder finding."""
    # CLEAN's only `{decision}` lives inside the ```mermaid fence; it must not be read
    # as an unfilled template token.
    categories = cats(lint_spine.lint(CLEAN))
    assert "placeholder" not in categories


def test_placeholder_markers_caught():
    """Swapping rule text for a literal ``TBD`` yields a placeholder finding."""
    spine = CLEAN.replace("the command bus", "TBD")
    categories = cats(lint_spine.lint(spine))
    assert "placeholder" in categories


def test_similar_to_caught():
    """A "similar to AD-1" field value yields a finding whose detail mentions cross-reference."""
    spine = CLEAN.replace("import cycles", "similar to AD-1")
    findings = lint_spine.lint(spine)["findings"]
    assert any("cross-reference" in finding["detail"] for finding in findings)


def test_unfilled_template_token_caught():
    """A bare ``{decision}`` token outside any fence is reported as a placeholder."""
    spine = CLEAN.replace("single write path", "{decision}")
    findings = lint_spine.lint(spine)["findings"]
    assert any(finding["category"] == "placeholder" for finding in findings)


def test_duplicate_ad_id_caught():
    """Two headings that both claim AD-1 produce an ``ad_id`` finding."""
    # Rewrite the second block's heading so it reuses the first block's id.
    spine = CLEAN.replace(
        "### AD-2 — layered deps `[ADOPTED]`",
        "### AD-1 — layered deps",
    )
    categories = cats(lint_spine.lint(spine))
    assert "ad_id" in categories


def test_non_monotonic_ad_id_caught():
    """AD ids that decrease down the document (AD-9 then AD-5) are reported as non-monotonic."""
    # Renumber the second heading first, then the first one, so the document reads
    # AD-9 followed by AD-5.
    spine = CLEAN.replace("### AD-2 — layered deps `[ADOPTED]`", "### AD-5 — layered deps")
    spine = spine.replace("### AD-1 — single write path", "### AD-9 — single write path")
    findings = lint_spine.lint(spine)["findings"]
    assert any("non-monotonic" in finding["detail"] for finding in findings)


def test_missing_field_caught():
    """Deleting AD-1's Rule bullet yields an ``ad_fields`` finding that names ``rule``."""
    spine = CLEAN.replace("- **Rule:** state changes only through the command bus\n", "")
    findings = lint_spine.lint(spine)["findings"]
    assert any(
        finding["category"] == "ad_fields" and "rule" in finding["detail"]
        for finding in findings
    )


def test_unpinned_dep_caught():
    """A Stack row with an empty Version cell yields a ``version_pin`` finding."""
    spine = CLEAN.replace("| fastapi | 0.115 |", "| fastapi |  |")
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" in categories


def test_placeholder_version_caught():
    """A ``{pin}`` token in the Version cell yields a ``version_pin`` finding naming fastapi."""
    spine = CLEAN.replace("| fastapi | 0.115 |", "| fastapi | {pin} |")
    findings = lint_spine.lint(spine)["findings"]
    assert any(
        finding["category"] == "version_pin" and "fastapi" in finding["detail"]
        for finding in findings
    )


def test_no_stack_section_ok():
    """A spine with no Stack section at all produces no ``version_pin`` finding."""
    # Keep only the text that precedes the Stack heading.
    before_stack, _, _ = CLEAN.partition("## Stack")
    categories = cats(lint_spine.lint(before_stack))
    assert "version_pin" not in categories


def test_stack_skeleton_row_not_version_pinned():
    """An untouched template row (token name, token version) is not a ``version_pin`` finding."""
    # A leftover {token} in the Name cell belongs to the placeholder pass; reporting it
    # as version_pin as well would double-count the same defect.
    skeleton_row = "| {language / framework} | {pinned version} |"
    spine = CLEAN.replace("| fastapi | 0.115 |", skeleton_row)
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" not in categories


def test_stack_html_comment_not_parsed_as_row():
    """An HTML comment placed under the Stack heading does not yield a ``version_pin`` finding."""
    spine = CLEAN.replace(
        "## Stack\n",
        "## Stack\n\n<!-- SEED — verified current 2026-06 -->\n",
    )
    categories = cats(lint_spine.lint(spine))
    assert "version_pin" not in categories


def test_template_token_is_low_severity():
    """Template-token placeholder findings exist and every one carries severity ``low``."""
    # A bare {token} may be legitimate brace prose, so it is reported at low (not high)
    # severity to keep the mechanical pass close to zero false positives.
    spine = CLEAN.replace("single write path", "{decision}")
    token_findings = [
        finding
        for finding in lint_spine.lint(spine)["findings"]
        if finding["category"] == "placeholder" and "template token" in finding["detail"]
    ]
    assert token_findings
    assert all(finding["severity"] == "low" for finding in token_findings)


def test_no_frontmatter_body_still_scanned():
    """A document with no frontmatter block still has its body checked for placeholders."""
    spine = "## Invariants\n\n### AD-1 — x\n\n- **Binds:** all\n- **Prevents:** drift\n- **Rule:** TBD\n"
    categories = cats(lint_spine.lint(spine))
    # The TBD in the Rule bullet must be reported even though no frontmatter precedes it.
    assert "placeholder" in categories


def test_frontmatter_value_with_dashes_not_truncated():
    """An inline ``---`` inside a frontmatter value is not taken as the closing fence."""
    # If the inline '---' ended the frontmatter early, the Stack table below would not
    # be read as intended; the unpinned fastapi row must still be reported.
    frontmatter = "---\nname: 'x'\nscope: 'phase 1 --- phase 2'\n---\n\n"
    stack = "## Stack\n\n| Name | Version |\n| --- | --- |\n| fastapi |  |\n"
    findings = lint_spine.lint(frontmatter + stack)["findings"]
    assert any(finding["category"] == "version_pin" for finding in findings)


def test_ad_heading_in_fence_not_counted():
    """An AD heading shown inside a code fence is not treated as a live AD block."""
    frontmatter = "---\nname: 'x'\n---\n\n"
    live_ad = "### AD-1 — real\n\n- **Binds:** all\n- **Prevents:** drift\n- **Rule:** do x\n\n"
    fenced_example = "## Docs\n\n```text\n### AD-2 — illustrative only, no fields\n```\n"
    report = lint_spine.lint(frontmatter + live_ad + fenced_example)
    # The fenced AD-2 has no fields; were it counted as live, the lint would not be ok.
    assert report["ok"] is True


def test_stack_table_flags_only_the_unpinned_row():
    """With one pinned and one unpinned row, exactly one ``version_pin`` finding names redis."""
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| fastapi | 0.115 |\n| redis |  |\n"
    findings = lint_spine.lint(table_head + table_rows)["findings"]
    unpinned = [finding for finding in findings if finding["category"] == "version_pin"]
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]


def test_stack_table_all_pinned_ok():
    """A Stack table whose only row has a version produces no ``version_pin`` finding."""
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| fastapi | 0.115 |\n"
    categories = cats(lint_spine.lint(table_head + table_rows))
    assert "version_pin" not in categories


def test_fenced_stack_rows_not_parsed():
    """A blank-version row inside a code fence under the Stack heading is not a finding."""
    # The fenced table is illustrative only: its `| example |  |` row must not be read
    # as a live Stack row, so no version_pin finding is expected.
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Name | Version |\n| --- | --- |\n"
    rows_then_fence = "| fastapi | 0.115 |\n\n```text\n| example |  |\n```\n"
    categories = cats(lint_spine.lint(table_head + rows_then_fence))
    assert "version_pin" not in categories


def test_fenced_stack_heading_not_live():
    """A ``## Stack`` heading that appears only inside a code fence opens no live Stack section."""
    spine = "---\nname: 'x'\n---\n\n## Docs\n\n```md\n## Stack\n\n| foo |  |\n```\n"
    categories = cats(lint_spine.lint(spine))
    # The fenced `| foo |  |` row must therefore not be reported as unpinned.
    assert "version_pin" not in categories


def test_renamed_stack_heading_still_scanned():
    """A heading that extends ``## Stack`` (here "Stack & Versions") is still scanned for pins."""
    table_head = "---\nname: 'x'\n---\n\n## Stack & Versions\n\n| Name | Version |\n| --- | --- |\n"
    table_rows = "| redis |  |\n"
    findings = lint_spine.lint(table_head + table_rows)["findings"]
    unpinned = [finding for finding in findings if finding["category"] == "version_pin"]
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]


def test_reordered_columns_pair_name_to_version():
    """With a Version-then-Name header, the unpinned row is still reported under its real name."""
    table_head = "---\nname: 'x'\n---\n\n## Stack\n\n| Version | Name |\n| --- | --- |\n"
    table_rows = "| 0.115 | fastapi |\n|  | redis |\n"
    findings = lint_spine.lint(table_head + table_rows)["findings"]
    unpinned = [finding for finding in findings if finding["category"] == "version_pin"]
    # Only the redis row lacks a version, and the finding must name redis.
    assert len(unpinned) == 1
    assert "redis" in unpinned[0]["detail"]


def test_placeholder_line_number_is_absolute():
    """A TBD that follows a multi-line fence is reported at its real file line.

    The document below puts ``TBD here`` on line 13 (3 frontmatter lines, a blank, the
    heading, a blank, a 5-line fence, a blank, then the TBD). The finding's ``location``
    must carry that absolute number, i.e. the fence must not shift later line numbers.
    """
    text = (
        "---\nname: 'x'\n---\n\n"
        "## A\n\n"
        "```text\nf1\nf2\nf3\n```\n\n"
        "TBD here\n"
    )
    result = lint_spine.lint(text)
    # Use a default so a missing finding fails as a readable assertion instead of a
    # bare StopIteration escaping from next().
    ph = next((f for f in result["findings"] if "TBD" in f["detail"]), None)
    assert ph is not None, f"no finding mentions TBD: {result['findings']!r}"
    # Likewise, fail clearly when the location string carries no "line N" at all.
    match = re.search(r"line (\d+)", ph["location"])
    assert match is not None, f"no line number in location {ph['location']!r}"
    assert int(match.group(1)) == 13


def test_missing_spine_file_reports_error(tmp_path, capsys):
    """Running main against an empty workspace prints error JSON and returns 0."""
    exit_code = lint_spine.main(["--workspace", str(tmp_path)])
    payload = json.loads(capsys.readouterr().out)
    assert exit_code == 0
    assert payload["ok"] is False
    assert "not found" in payload["error"]


def test_frontmatter_unfilled_token_caught():
    """An unfilled ``{...}`` token in a frontmatter value is reported as a frontmatter placeholder."""
    # Frontmatter fields are part of the contract, so a leftover template token there
    # must be linted just like one in the body.
    spine = "---\nname: 'x'\nscope: '{what this spine governs}'\n---\n\n## Invariants\n"
    frontmatter_hits = [
        finding
        for finding in lint_spine.lint(spine)["findings"]
        if finding["category"] == "placeholder" and "frontmatter" in finding["detail"]
    ]
    assert frontmatter_hits
    assert any("template token" in finding["detail"] for finding in frontmatter_hits)


def test_frontmatter_tbd_caught():
    """A literal ``TBD`` frontmatter value is reported as a frontmatter placeholder naming TBD."""
    spine = "---\nname: 'x'\nstatus: TBD\n---\n\n## Invariants\n"
    findings = lint_spine.lint(spine)["findings"]
    assert any(
        finding["category"] == "placeholder"
        and "frontmatter" in finding["detail"]
        and "TBD" in finding["detail"]
        for finding in findings
    )


def test_unreadable_spine_returns_error_not_crash(tmp_path, capsys):
    """A spine file that is not valid UTF-8 yields error JSON and exit code 0, not a traceback."""
    spine_path = tmp_path / lint_spine.SPINE
    # Bytes that exist on disk but cannot be decoded as UTF-8.
    spine_path.write_bytes(b"\xff\xfe bad bytes not utf-8")
    exit_code = lint_spine.main(["--workspace", str(tmp_path)])
    payload = json.loads(capsys.readouterr().out)
    assert exit_code == 0
    assert payload["ok"] is False
    assert "could not read" in payload["error"]


if __name__ == "__main__":
    # Allow running this file directly: hand it to pytest in quiet mode and propagate
    # pytest's exit status to the shell.
    _exit_status = pytest.main([__file__, "-q"])
    sys.exit(_exit_status)