Merge pull request #2 from rotationalphysics495/feat/design-phase-hardening

Harden epic-execute design phase: bounded context, JSON plans, critic loop
2026-06-03 06:12:52 -05:00 · 2026-06-03 06:12:52 -05:00 · f61b835eef
parent 0d08dddc96 4f0a4f4a03
commit f61b835eef
4 changed files with 478 additions and 65 deletions
--- a/scripts/epic-execute-lib/design-phase.sh
+++ b/scripts/epic-execute-lib/design-phase.sh
@ -15,6 +15,69 @@
 # Stores the last design output for passing to dev phase
 LAST_DESIGN=""

+# Stores the gaps reported by the most recent design critic pass
+DESIGN_CRITIC_GAPS=""
+
+# =============================================================================
+# Codebase Exploration (deterministic, language-aware)
+# =============================================================================
+
+# Detect the project's primary language/toolchain from marker files.
+# Mirrors the detection used by the static-analysis gate.
+# Returns one of: node | rust | go | python | unknown
+detect_project_type() {
+    if [ -f "$PROJECT_ROOT/package.json" ]; then
+        echo "node"
+    elif [ -f "$PROJECT_ROOT/Cargo.toml" ]; then
+        echo "rust"
+    elif [ -f "$PROJECT_ROOT/go.mod" ]; then
+        echo "go"
+    elif [ -f "$PROJECT_ROOT/requirements.txt" ] || [ -f "$PROJECT_ROOT/pyproject.toml" ]; then
+        echo "python"
+    else
+        echo "unknown"
+    fi
+}
+
+# Build a deterministic, bounded repository map for the planner to start from,
+# tailored to the detected language. This replaces the old hardcoded JS/TS
+# find commands and the "hope the model explores" approach with concrete,
+# pre-computed context.
+build_repo_map() {
+    local ptype
+    ptype=$(detect_project_type)
+
+    local lang_label=""
+    local find_expr=()
+    case "$ptype" in
+        node)   lang_label="Node.js / TypeScript"; find_expr=(-name '*.ts' -o -name '*.tsx' -o -name '*.js' -o -name '*.jsx') ;;
+        rust)   lang_label="Rust";                 find_expr=(-name '*.rs') ;;
+        go)     lang_label="Go";                   find_expr=(-name '*.go') ;;
+        python) lang_label="Python";               find_expr=(-name '*.py') ;;
+        *)      lang_label="Unknown" ;;
+    esac
+
+    # Top-level directory structure (excluding noise dirs)
+    local top
+    top=$(cd "$PROJECT_ROOT" 2>/dev/null && ls -d */ 2>/dev/null \
+        | grep -vE '^(node_modules|\.git|dist|build|target|vendor|__pycache__|\.venv|coverage)/' \
+        | head -30)
+
+    # Representative source files for the detected language (bounded)
+    local sources=""
+    if [ "${#find_expr[@]}" -gt 0 ]; then
+        sources=$(cd "$PROJECT_ROOT" 2>/dev/null && find . \( "${find_expr[@]}" \) \
+            -not -path '*/node_modules/*' -not -path '*/.git/*' \
+            -not -path '*/dist/*' -not -path '*/build/*' \
+            -not -path '*/target/*' -not -path '*/vendor/*' \
+            -not -path '*/__pycache__/*' -not -path '*/.venv/*' \
+            2>/dev/null | sed 's|^\./||' | head -40)
+    fi
+
+    printf 'Detected project type: %s\n\nTop-level structure:\n%s\n\nRepresentative source files:\n%s\n' \
+        "$lang_label" "${top:-(none)}" "${sources:-(none detected)}"
+}
+
 # =============================================================================
 # Design Phase Functions
 # =============================================================================
@ -32,24 +95,67 @@ execute_design_phase() {

    log ">>> DESIGN PHASE: $story_id"

+    # Story is inlined (small, bounded, and the planner needs it in full)
    local story_contents=$(cat "$story_file")

-    # Load architecture file if available
-    local arch_contents=""
+    # Locate the architecture file but pass it by PATH, not embedded contents.
+    # architecture.md is the main unbounded size risk in this prompt.
+    local arch_file=""
    for search_path in "$PROJECT_ROOT/docs/architecture.md" "$PROJECT_ROOT/docs/architecture/architecture.md" "$PROJECT_ROOT/architecture.md"; do
        if [ -f "$search_path" ]; then
-            arch_contents=$(cat "$search_path")
+            arch_file="$search_path"
            break
        fi
    done

-    # Load previous decisions for context
+    # Load previous decisions for context, bounded to the last 20KB
+    # (matches the dev phase; the decision log grows across the epic).
    local decision_context=""
    if type get_decision_log_context >/dev/null 2>&1; then
        decision_context=$(get_decision_log_context)
+        local dec_size
+        dec_size=$(get_byte_size "$decision_context")
+        if [ "$dec_size" -gt 20000 ]; then
+            decision_context=$(printf '%s' "$decision_context" | tail -c 20000)
+            [ "$VERBOSE" = true ] && log_warn "Design: decision log truncated to last 20KB"
+        fi
    fi

-    local design_prompt="You are a senior developer planning the implementation of a story.
+    # Pre-compute a deterministic, language-aware repository map (#5)
+    local repo_map=""
+    if type build_repo_map >/dev/null 2>&1; then
+        repo_map=$(build_repo_map)
+    fi
+
+    if [ "$DRY_RUN" = true ]; then
+        echo "[DRY RUN] Would execute design phase for $story_id"
+        return 0
+    fi
+
+    # Critic loop (#4): generate a plan, have a fresh-context critic check it
+    # against the ACs and architecture, and regenerate with feedback if gaps
+    # remain. Design is advisory, so we always proceed with the best plan.
+    local max_attempts="${MAX_DESIGN_CRITIC_ATTEMPTS:-2}"
+    local attempt=1
+    local feedback=""
+    local json=""
+
+    while true; do
+        # Revision block is empty on the first pass, populated by the critic
+        local revision_block=""
+        if [ -n "$feedback" ]; then
+            revision_block="## Revision Required
+
+A previous version of this plan was reviewed and found incomplete. Produce an
+improved plan that resolves ALL of the following gaps:
+
+<gaps>
+$feedback
+</gaps>
+"
+        fi
+
+        local design_prompt="You are a senior developer planning the implementation of a story.

 ## Your Task

@ -74,9 +180,7 @@ $story_contents

 ## Architecture Reference

-<architecture>
-$arch_contents
-</architecture>
+**Read the architecture document at:** ${arch_file:-"(none found)"}

 ## Previous Decisions in This Epic

@ -84,83 +188,316 @@ $arch_contents
 $decision_context
 </decision-context>

-## Exploration Commands
+## Repository Map

-First, explore the codebase to understand existing patterns:
-\`\`\`bash
-# Find similar implementations
-find . -type f -name \"*.ts\" -o -name \"*.js\" | head -20
-# Check project structure
-ls -la src/ 2>/dev/null || ls -la
-\`\`\`
+Use this pre-computed map of the codebase as your starting point, then explore
+further (read the listed files, find similar implementations) before planning.
+Follow existing patterns rather than introducing new ones.

-## Required Output
+<repo-map>
+$repo_map
+</repo-map>

-Output your implementation plan in this exact format:
+${revision_block}## Required Output

-\`\`\`
-DESIGN START
-story_id: $story_id
+Output your implementation plan as a single JSON result block. Map EVERY
+acceptance criterion in the story to the files/functions that will implement
+it - the \"ac\" field must use the exact AC identifier from the story (e.g.
+\"AC1\", \"AC2\").

-files_to_modify:
-  - path: <file path>
-    action: create|modify
-    purpose: <why this file needs changes>
-
-patterns_to_use:
-  - <pattern name>: <how it will be applied>
-
-dependencies:
-  - <package>: <installed|needs-install>
-
-acceptance_criteria_mapping:
-  - AC1: <which files/functions will implement this>
-  - AC2: <which files/functions will implement this>
-
-risks:
-  - <potential issue and mitigation>
-
-estimated_test_files:
-  - <test file path>: <what it will test>
-
-implementation_order:
-  1. <first step>
-  2. <second step>
-  ...
-DESIGN END
+\`\`\`json
+{
+  \"status\": \"COMPLETE\",
+  \"story_id\": \"$story_id\",
+  \"summary\": \"<one-line description of the planned approach>\",
+  \"files_to_modify\": [
+    {\"path\": \"<file path>\", \"action\": \"create|modify\", \"purpose\": \"<why>\"}
+  ],
+  \"patterns_to_use\": [
+    {\"pattern\": \"<pattern name>\", \"how\": \"<how it will be applied>\"}
+  ],
+  \"dependencies\": [
+    {\"package\": \"<name>\", \"state\": \"installed|needs-install\"}
+  ],
+  \"acceptance_criteria_mapping\": [
+    {\"ac\": \"AC1\", \"covered_by\": \"<files/functions implementing this AC>\"}
+  ],
+  \"risks\": [
+    {\"risk\": \"<potential issue>\", \"mitigation\": \"<how to mitigate>\"}
+  ],
+  \"test_files\": [
+    {\"path\": \"<test file path>\", \"covers\": \"<what it will test>\"}
+  ],
+  \"implementation_order\": [\"<first step>\", \"<second step>\"]
+}
 \`\`\`

 Be specific and concrete. This plan will guide the implementation phase.

+If you cannot produce a plan (e.g. the story is too ambiguous to design),
+output the same JSON block with \"status\": \"BLOCKED\" and a \"summary\"
+explaining why.
+
 ## Completion Signal

-After outputting the design block, output exactly:
+After outputting the JSON block, output exactly:
 DESIGN COMPLETE: $story_id"

-    if [ "$DRY_RUN" = true ]; then
-        echo "[DRY RUN] Would execute design phase for $story_id"
-        return 0
+        # Log prompt size in verbose mode (consistent with other phases)
+        log_prompt_size "$design_prompt" "design-phase"
+
+        # Pipe to file to avoid memory bloat
+        run_claude_to_file "$design_prompt"
+        local result
+        result=$(read_phase_tail)
+
+        # Extract the JSON plan using the shared parser (falls back to legacy
+        # text scraping if no JSON block is present, e.g. older models).
+        json=""
+        if type extract_json_result >/dev/null 2>&1; then
+            json=$(extract_json_result "$result")
+        fi
+
+        # Determine completion using the shared JSON-first checker
+        local completion_status=0
+        if type check_phase_completion >/dev/null 2>&1; then
+            check_phase_completion "$result" "design" "$story_id"
+            completion_status=$?
+        fi
+
+        if [ -n "$json" ] && [ "$completion_status" -ne 1 ]; then
+            # Valid JSON plan
+            LAST_DESIGN="$json"
+        else
+            # Fall back to legacy DESIGN START/END text block (backward compat)
+            LAST_DESIGN=$(echo "$result" | sed -n '/DESIGN START/,/DESIGN END/p')
+        fi
+
+        if [ -z "$LAST_DESIGN" ] || [ "$completion_status" -eq 1 ]; then
+            log_error "Design phase did not produce a valid plan"
+            return 1
+        fi
+
+        # Critic disabled or no attempts budgeted - accept the first plan
+        if [ "${SKIP_DESIGN_CRITIC:-false}" = true ] || [ "$max_attempts" -le 0 ]; then
+            break
+        fi
+
+        # Run the critic against the plan
+        run_design_critic "$story_file" "$story_id" "$arch_file" "$LAST_DESIGN"
+        local verdict=$?
+
+        if [ "$verdict" -ne 1 ]; then
+            # Approved (0) or unclear (2) - accept the current plan
+            if [ "$verdict" -eq 2 ]; then
+                log_warn "Design critic result unclear for $story_id - accepting current plan"
+            elif [ "$VERBOSE" = true ]; then
+                log "Design critic approved the plan: $story_id"
+            fi
+            break
+        fi
+
+        # verdict == 1: revision requested
+        if [ -z "$DESIGN_CRITIC_GAPS" ]; then
+            log_warn "Design critic requested revision but listed no actionable gaps - proceeding"
+            break
+        fi
+
+        if [ "$attempt" -ge "$max_attempts" ]; then
+            log_warn "Design still has gaps after $attempt critic attempt(s) for $story_id - proceeding with documented gaps"
+            if type add_metrics_issue >/dev/null 2>&1; then
+                add_metrics_issue "$story_id" "design_critic_gaps" "Unresolved design gaps after $attempt critic attempt(s)"
+            fi
+            break
+        fi
+
+        log_warn "Design critic requested revisions (attempt $attempt of $max_attempts) for $story_id - regenerating plan"
+        feedback="$DESIGN_CRITIC_GAPS"
+        attempt=$((attempt + 1))
+    done
+
+    # Persist the plan to a per-story file so the dev phase can read it
+    # even after a resume (when the in-memory LAST_DESIGN is empty).
+    persist_design "$story_id" "$LAST_DESIGN"
+
+    # Validate that every acceptance criterion is mapped (advisory warning).
+    validate_design_coverage "$story_file" "$story_id" "$json"
+
+    # Save to decision log
+    if type append_to_decision_log >/dev/null 2>&1; then
+        append_to_decision_log "DESIGN" "$story_id" "$LAST_DESIGN"
    fi

-    # Pipe to file to avoid memory bloat
-    run_claude_to_file "$design_prompt"
+    log_success "Design phase complete: $story_id"
+    return 0
+}
+
+# Run a fresh-context critic pass over a proposed design plan (#4).
+# The critic checks two things: (a) does the plan map every acceptance
+# criterion, and (b) does it conform to the architecture. Gaps are stored in
+# DESIGN_CRITIC_GAPS for feedback into a regeneration pass.
+# Arguments:
+#   $1 - story_file path
+#   $2 - story_id
+#   $3 - architecture file path (may be empty)
+#   $4 - the proposed plan (JSON or text)
+# Returns: 0 approved, 1 needs revision, 2 unclear
+run_design_critic() {
+    local story_file="$1"
+    local story_id="$2"
+    local arch_file="$3"
+    local plan="$4"
+
+    DESIGN_CRITIC_GAPS=""
+
+    local story_contents
+    story_contents=$(cat "$story_file")
+
+    local critic_prompt="You are a skeptical senior engineer reviewing an implementation PLAN before any code is written.
+
+## Your Task
+
+Critique the proposed plan for story: $story_id
+
+You are reviewing a PLAN, not code. Be rigorous. Decide whether the plan:
+1. Maps EVERY acceptance criterion in the story to concrete files/functions
+2. Conforms to the project's architecture
+3. Is concrete and actionable (no vague hand-waving)
+
+## Story
+
+<story>
+$story_contents
+</story>
+
+## Architecture Reference
+
+**Read the architecture document at:** ${arch_file:-"(none found)"}
+
+## Proposed Plan
+
+<plan>
+$plan
+</plan>
+
+## Required Output
+
+Output a single JSON result block:
+
+\`\`\`json
+{
+  \"status\": \"APPROVED\" | \"NEEDS_REVISION\",
+  \"story_id\": \"$story_id\",
+  \"gaps\": [
+    {\"issue\": \"<what is missing or wrong>\", \"recommendation\": \"<how to fix it>\"}
+  ]
+}
+\`\`\`
+
+Use APPROVED only if the plan covers every acceptance criterion and conforms to
+the architecture. Otherwise use NEEDS_REVISION and list specific, actionable gaps.
+
+## Completion Signal
+
+After the JSON block, output exactly one of:
+DESIGN CRITIC APPROVED: $story_id
+DESIGN CRITIC NEEDS_REVISION: $story_id"
+
+    log_prompt_size "$critic_prompt" "design-critic"
+
+    run_claude_to_file "$critic_prompt"
    local result
    result=$(read_phase_tail)

-    # Extract design block
-    LAST_DESIGN=$(echo "$result" | sed -n '/DESIGN START/,/DESIGN END/p')
+    # Parse verdict + gaps (JSON first, text fallback)
+    local status=""
+    local cjson=""
+    if type extract_json_result >/dev/null 2>&1; then
+        cjson=$(extract_json_result "$result")
+    fi

-    if [ -n "$LAST_DESIGN" ]; then
-        # Save to decision log
-        if type append_to_decision_log >/dev/null 2>&1; then
-            append_to_decision_log "DESIGN" "$story_id" "$LAST_DESIGN"
+    if [ -n "$cjson" ] && command -v jq >/dev/null 2>&1; then
+        status=$(echo "$cjson" | jq -r '.status // empty' | tr '[:lower:]' '[:upper:]')
+        DESIGN_CRITIC_GAPS=$(echo "$cjson" | jq -r '.gaps[]? | "- \(.issue) -> \(.recommendation)"' 2>/dev/null || echo "")
+    fi
+
+    # Text fallback if JSON missing/unparseable
+    if [ -z "$status" ]; then
+        if echo "$result" | grep -q "DESIGN CRITIC APPROVED"; then
+            status="APPROVED"
+        elif echo "$result" | grep -q "DESIGN CRITIC NEEDS_REVISION"; then
+            status="NEEDS_REVISION"
        fi
+    fi

-        log_success "Design phase complete: $story_id"
+    case "$status" in
+        APPROVED)       return 0 ;;
+        NEEDS_REVISION) return 1 ;;
+        *)              return 2 ;;
+    esac
+}
+
+# Validate that the design plan maps every acceptance criterion in the story.
+# This is advisory: it warns and records a metric but never fails the story
+# (design is a non-blocking phase). AC extraction is heuristic since story
+# formats vary; if no ACs are detected the check is skipped.
+# Arguments:
+#   $1 - story_file path
+#   $2 - story_id
+#   $3 - JSON plan (may be empty if the model fell back to text output)
+validate_design_coverage() {
+    local story_file="$1"
+    local story_id="$2"
+    local json="$3"
+
+    # Coverage check requires jq and a JSON plan; skip otherwise.
+    if [ -z "$json" ] || ! command -v jq >/dev/null 2>&1; then
        return 0
+    fi
+
+    # Count distinct AC identifiers declared in the story (e.g. AC1, AC2, ...).
+    local ac_count
+    ac_count=$(grep -oiE '\bAC[0-9]+\b' "$story_file" 2>/dev/null | tr '[:lower:]' '[:upper:]' | sort -u | wc -l | tr -d ' ')
+
+    if [ "${ac_count:-0}" -eq 0 ]; then
+        # No recognizable AC identifiers in this story - nothing to validate.
+        return 0
+    fi
+
+    # Count distinct ACs the plan claims to cover.
+    local mapped
+    mapped=$(echo "$json" | jq -r '[.acceptance_criteria_mapping[]?.ac] | map(ascii_upcase) | unique | length' 2>/dev/null || echo 0)
+    mapped=$(echo "$mapped" | tr -d '[:space:]')
+    [ -z "$mapped" ] && mapped=0
+
+    if [ "$mapped" -lt "$ac_count" ]; then
+        log_warn "Design maps $mapped of $ac_count acceptance criteria for $story_id"
+        if type add_metrics_issue >/dev/null 2>&1; then
+            add_metrics_issue "$story_id" "design_incomplete" "Plan maps $mapped/$ac_count acceptance criteria"
+        fi
    else
-        log_error "Design phase did not produce valid output"
-        return 1
+        [ "$VERBOSE" = true ] && log "Design covers all $ac_count acceptance criteria for $story_id"
+    fi
+}
+
+# Persist a design plan to a per-story file under DESIGN_DIR.
+# Arguments:
+#   $1 - story_id
+#   $2 - design content
+persist_design() {
+    local story_id="$1"
+    local content="$2"
+
+    if [ -z "${DESIGN_DIR:-}" ]; then
+        return 0
+    fi
+
+    mkdir -p "$DESIGN_DIR" 2>/dev/null || true
+    local design_file="$DESIGN_DIR/${story_id}-design.md"
+    if printf '%s\n' "$content" > "$design_file" 2>/dev/null; then
+        [ "$VERBOSE" = true ] && log "Design plan saved: $design_file"
+    else
+        log_warn "Failed to persist design plan: $design_file"
    fi
 }

@ -170,12 +507,64 @@ get_last_design() {
    echo "$LAST_DESIGN"
 }

+# Build a focused "planned test files" context block from the design plan (#7).
+# Lets the TDD test-spec phase reuse the test files the design already proposed,
+# rather than independently deciding the test surface. Reads the in-memory plan
+# first, then the persisted file (resume-safe). Requires a JSON plan + jq.
+# Arguments:
+#   $1 - story_id
+build_planned_test_files_context() {
+    local story_id="$1"
+
+    local design="$LAST_DESIGN"
+    if [ -z "$design" ] && [ -n "${DESIGN_DIR:-}" ]; then
+        local design_file="$DESIGN_DIR/${story_id}-design.md"
+        [ -f "$design_file" ] && design=$(cat "$design_file")
+    fi
+
+    if [ -z "$design" ] || ! command -v jq >/dev/null 2>&1; then
+        echo ""
+        return
+    fi
+
+    local files
+    files=$(echo "$design" | jq -r '.test_files[]? | "- \(.path): \(.covers)"' 2>/dev/null || echo "")
+
+    if [ -z "$files" ]; then
+        echo ""
+        return
+    fi
+
+    cat << EOF
+
+## Planned Test Files (from design phase)
+
+The design phase already identified the intended test files below. Align your
+specifications with these paths and reuse them; only introduce a new test file
+when a scenario genuinely isn't covered here, and call out any deviation.
+
+<planned-test-files>
+$files
+</planned-test-files>
+EOF
+}
+
 # Build the design context block for dev phase prompt
 # Returns formatted design context for inclusion in prompts
 build_design_context_for_dev() {
    local story_id="$1"

-    if [ -z "$LAST_DESIGN" ]; then
+    # Prefer the in-memory plan; fall back to the persisted file so a resumed
+    # run (where LAST_DESIGN is empty) still gets the design context.
+    local design="$LAST_DESIGN"
+    if [ -z "$design" ] && [ -n "${DESIGN_DIR:-}" ]; then
+        local design_file="$DESIGN_DIR/${story_id}-design.md"
+        if [ -f "$design_file" ]; then
+            design=$(cat "$design_file")
+        fi
+    fi
+
+    if [ -z "$design" ]; then
        echo ""
        return
    fi
@ -186,7 +575,7 @@ build_design_context_for_dev() {
 The following design was created in the planning phase. Follow this plan:

 <design-plan>
-$LAST_DESIGN
+$design
 </design-plan>

 ### Implementation Guidelines Based on Design
--- a/scripts/epic-execute-lib/json-output.sh
+++ b/scripts/epic-execute-lib/json-output.sh
@ -299,6 +299,13 @@ check_phase_completion() {

    # Fallback to legacy text-based parsing
    case "$phase_type" in
+        design)
+            if echo "$output" | grep -q "DESIGN COMPLETE"; then
+                return 0
+            elif echo "$output" | grep -q "DESIGN BLOCKED"; then
+                return 1
+            fi
+            ;;
        dev)
            if echo "$output" | grep -q "IMPLEMENTATION COMPLETE"; then
                return 0
--- a/scripts/epic-execute-lib/tdd-flow.sh
+++ b/scripts/epic-execute-lib/tdd-flow.sh
@ -54,6 +54,13 @@ execute_test_spec_phase() {
        design_context=$(get_last_design)
    fi

+    # Get the test files the design phase already planned, so the test-spec
+    # phase reuses them instead of deciding the test surface independently (#7).
+    local planned_tests=""
+    if type build_planned_test_files_context >/dev/null 2>&1; then
+        planned_tests=$(build_planned_test_files_context "$story_id")
+    fi
+
    local spec_prompt="You are a Test Architect (TEA) generating test specifications from acceptance criteria.

 ## Your Task
@ -89,7 +96,7 @@ $arch_contents
 <design>
 $design_context
 </design>
-
+$planned_tests
 ## Exploration Commands

 First, explore existing test patterns in the codebase:
--- a/scripts/epic-execute.sh
+++ b/scripts/epic-execute.sh
@ -139,6 +139,8 @@ SPRINTS_DIR="$PROJECT_ROOT/docs/sprints"
 EPICS_DIR="$PROJECT_ROOT/docs/epics"
 UAT_DIR="$PROJECT_ROOT/docs/uat"
 LOGS_DIR="$SPRINT_ARTIFACTS_DIR/logs"
+# Per-story design plans (persisted so dev phase can read them after resume)
+DESIGN_DIR="$SPRINT_ARTIFACTS_DIR/design"

 # Temporary log file during execution - will be copied to LOGS_DIR on completion
 LOG_FILE="/tmp/bmad-epic-execute-$$.log"
@ -934,6 +936,7 @@ OPTIONS:

    TDD/Testing Options:
      --skip-design         Skip pre-implementation design phase
+      --skip-design-critic  Skip the design plan critic/revision loop
      --skip-tdd            Skip all test-first development phases
      --skip-test-spec      Skip test specification phase only
      --skip-test-impl      Skip test implementation phase only
@ -974,6 +977,7 @@ ENVIRONMENT VARIABLES:
    MAX_PROMPT_SIZE         Maximum prompt size in bytes (default: 150000)
    RETRY_MAX_ATTEMPTS      Max retry attempts for transient failures (default: 3)
    RETRY_INITIAL_DELAY     Initial retry delay in seconds (default: 5)
+    MAX_DESIGN_CRITIC_ATTEMPTS  Max design plan revision rounds (default: 2)

 FILES:
    Logs:       docs/sprint-artifacts/logs/epic-<id>-<timestamp>.log
@ -1003,6 +1007,7 @@ SKIP_TEST_QUALITY=false
 SKIP_TRACEABILITY=false
 SKIP_STATIC_ANALYSIS=false
 SKIP_DESIGN=false
+SKIP_DESIGN_CRITIC=false
 SKIP_REGRESSION=false
 SKIP_TDD=false
 SKIP_TEST_SPEC=false
@ -1071,6 +1076,10 @@ while [[ $# -gt 0 ]]; do
            SKIP_DESIGN=true
            shift
            ;;
+        --skip-design-critic)
+            SKIP_DESIGN_CRITIC=true
+            shift
+            ;;
        --skip-regression)
            SKIP_REGRESSION=true
            shift
@ -1118,6 +1127,7 @@ if [ -z "$EPIC_ID" ]; then
    echo "  --skip-traceability  Skip traceability check (not recommended)"
    echo "  --skip-static-analysis  Skip static analysis gate (runs real tooling)"
    echo "  --skip-design     Skip pre-implementation design phase"
+    echo "  --skip-design-critic  Skip the design plan critic/revision loop"
    echo "  --skip-regression Skip regression test gate"
    echo "  --skip-tdd        Skip test-first development phases"
    echo "  --skip-test-spec  Skip test specification phase only"