From 1e06b6a5c6601afcf8b822d3820d3cf5a3c2319f Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 10:59:13 -0500
Subject: [PATCH 01/22] fix: dynamic base branch detection across all SKILL
 templates (v0.3.10) (#81)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: add {{BASE_BRANCH_DETECT}} resolver to gen-skill-docs

DRY placeholder for dynamic base branch detection across PR-targeting
skills. Detects via gh pr view (existing PR base) → gh repo view
(repo default) → fallback to main.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* fix: ship skill detects base branch instead of hardcoding main

Replaces ~14 hardcoded 'main' references with dynamic detection via
{{BASE_BRANCH_DETECT}}. Fixes stacked branches and Conductor workspaces
targeting non-main branches. Adds --base <base> to gh pr create.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* fix: review, qa, plan-ceo-review detect base branch dynamically

Same pattern as ship: replaces hardcoded 'main' with {{BASE_BRANCH_DETECT}}.
Also cleans up qa bash-isms (REPORT_DIR variable, port chaining).

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* fix: retro detects default branch instead of hardcoding origin/main

Retro queries commit history (not PR targets), so uses simpler detection:
gh repo view defaultBranchRef. Replaces ~11 origin/main refs with
origin/<default>.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add explicit cross-step references in gstack-upgrade template

Bash blocks are self-contained, but cross-block variable references
(INSTALL_DIR from Step 2) were implicit. Adds prose making them explicit.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs+test: SKILL authoring guidance + regression tests

Adds "Writing SKILL templates" section to CLAUDE.md explaining that
templates are prompts, not scripts. Adds validation test catching
hardcoded 'main' in git commands, and resolver content test.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: update ARCHITECTURE + CONTRIBUTING for new placeholders

Add {{BASE_BRANCH_DETECT}} to ARCHITECTURE.md placeholder list.
Cross-reference CLAUDE.md template authoring guidance from CONTRIBUTING.md.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: bump version and changelog (v0.3.10)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: add missing blank line between resolver functions

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* test: add 3 E2E smoke tests for base branch detection

- /review: verifies Step 0 detection + git diff against detected base
- /ship: truncated dry-run (Steps 0-1 only, no push/PR), asserts no
  destructive actions
- /retro: verifies default branch detection for git log queries

Covers the {{BASE_BRANCH_DETECT}} resolver path (review), the ship
template's dual abort check, and retro's inline detection pattern.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: bump version and changelog (v0.4.2)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 ARCHITECTURE.md               |   2 +
 CHANGELOG.md                  |  14 +++
 CLAUDE.md                     |  17 ++++
 CONTRIBUTING.md               |   2 +
 VERSION                       |   2 +-
 gstack-upgrade/SKILL.md       |   8 +-
 gstack-upgrade/SKILL.md.tmpl  |   8 +-
 plan-ceo-review/SKILL.md      |  21 +++-
 plan-ceo-review/SKILL.md.tmpl |   4 +-
 qa/SKILL.md                   |  22 +++-
 qa/SKILL.md.tmpl              |   5 +-
 retro/SKILL.md                |  34 ++++---
 retro/SKILL.md.tmpl           |  34 ++++---
 review/SKILL.md               |  33 ++++--
 review/SKILL.md.tmpl          |  16 +--
 scripts/gen-skill-docs.ts     |  22 ++++
 ship/SKILL.md                 |  49 ++++++---
 ship/SKILL.md.tmpl            |  32 +++---
 test/gen-skill-docs.test.ts   |  21 ++++
 test/skill-e2e.test.ts        | 187 ++++++++++++++++++++++++++++++++++
 test/skill-validation.test.ts |  58 +++++++++++
 21 files changed, 514 insertions(+), 77 deletions(-)
diff --git a/ARCHITECTURE.md b/ARCHITECTURE.md
index 5311c2cd..45768d07 100644
--- a/ARCHITECTURE.md
+++ b/ARCHITECTURE.md
@@ -200,6 +200,8 @@ Templates contain the workflows, tips, and examples that require human judgment.
 | `{{SNAPSHOT_FLAGS}}` | `snapshot.ts` | Flag reference with examples |
 | `{{PREAMBLE}}` | `gen-skill-docs.ts` | Startup block: update check, session tracking, contributor mode, AskUserQuestion format |
 | `{{BROWSE_SETUP}}` | `gen-skill-docs.ts` | Binary discovery + setup instructions |
+| `{{BASE_BRANCH_DETECT}}` | `gen-skill-docs.ts` | Dynamic base branch detection for PR-targeting skills (ship, review, qa, plan-ceo-review) |
+| `{{QA_METHODOLOGY}}` | `gen-skill-docs.ts` | Shared QA methodology block for /qa and /qa-only |
 
 This is structurally sound — if a command exists in code, it appears in docs. If it doesn't exist, it can't appear.
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 57c2c1a0..3d67a917 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,19 @@
 # Changelog
 
+## 0.4.2 — 2026-03-16
+
+- **Skills now respect your branch target.** `/ship`, `/review`, `/qa`, and `/plan-ceo-review` detect which branch your PR actually targets instead of assuming `main`. Stacked branches, Conductor workspaces targeting feature branches, and repos using `master` all just work now.
+- **`/retro` works on any default branch.** Repos using `master`, `develop`, or other default branch names are detected automatically — no more empty retros because the branch name was wrong.
+- **New `{{BASE_BRANCH_DETECT}}` placeholder** for skill authors — drop it into any template and get 3-step branch detection (PR base → repo default → fallback) for free.
+- **3 new E2E smoke tests** validate that base branch detection works end-to-end across the ship, review, and retro skills.
+
+### For contributors
+
+- Added "Writing SKILL templates" section to CLAUDE.md — rules for natural language over bash-isms, dynamic branch detection, self-contained code blocks.
+- Hardcoded-main regression test scans all `.tmpl` files for git commands with hardcoded `main`.
+- QA template cleaned up: removed `REPORT_DIR` shell variable, simplified port detection to prose.
+- gstack-upgrade template: explicit cross-step prose for variable references between bash blocks.
+
 ## 0.4.1 — 2026-03-16
 
 - **gstack now notices when it screws up.** Turn on contributor mode (`gstack-config set gstack_contributor true`) and gstack automatically writes up what went wrong — what you were doing, what broke, repro steps. Next time something annoys you, the bug report is already written. Fork gstack and fix it yourself.
diff --git a/CLAUDE.md b/CLAUDE.md
index e724b826..bc21f606 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -65,6 +65,23 @@ SKILL.md files are **generated** from `.tmpl` templates. To update docs:
 To add a new browse command: add it to `browse/src/commands.ts` and rebuild.
 To add a snapshot flag: add it to `SNAPSHOT_FLAGS` in `browse/src/snapshot.ts` and rebuild.
 
+## Writing SKILL templates
+
+SKILL.md.tmpl files are **prompt templates read by Claude**, not bash scripts.
+Each bash code block runs in a separate shell — variables do not persist between blocks.
+
+Rules:
+- **Use natural language for logic and state.** Don't use shell variables to pass
+  state between code blocks. Instead, tell Claude what to remember and reference
+  it in prose (e.g., "the base branch detected in Step 0").
+- **Don't hardcode branch names.** Detect `main`/`master`/etc. dynamically via
+  `gh pr view` or `gh repo view`. Use `{{BASE_BRANCH_DETECT}}` for PR-targeting
+  skills. Use "the base branch" in prose, `<base>` in code block placeholders.
+- **Keep bash blocks self-contained.** Each code block should work independently.
+  If a block needs context from a previous step, restate it in the prose above.
+- **Express conditionals as English.** Instead of nested `if/elif/else` in bash,
+  write numbered decision steps: "1. If X, do Y. 2. Otherwise, do Z."
+
 ## Browser interaction
 
 When you need to interact with a browser (QA, dogfooding, cookie setup), use the
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index abe1cf16..b06b837e 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -217,6 +217,8 @@ bun run skill:check
 bun run dev:skill
 ```
 
+For template authoring best practices (natural language over bash-isms, dynamic branch detection, `{{BASE_BRANCH_DETECT}}` usage), see CLAUDE.md's "Writing SKILL templates" section.
+
 To add a browse command, add it to `browse/src/commands.ts`. To add a snapshot flag, add it to `SNAPSHOT_FLAGS` in `browse/src/snapshot.ts`. Then rebuild.
 
 ## Conductor workspaces
diff --git a/VERSION b/VERSION
index 267577d4..2b7c5ae0 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.4.1
+0.4.2
diff --git a/gstack-upgrade/SKILL.md b/gstack-upgrade/SKILL.md
index 1cf7d548..42f13f69 100644
--- a/gstack-upgrade/SKILL.md
+++ b/gstack-upgrade/SKILL.md
@@ -94,14 +94,20 @@ fi
 echo "Install type: $INSTALL_TYPE at $INSTALL_DIR"
 ```
 
+The install type and directory path printed above will be used in all subsequent steps.
+
 ### Step 3: Save old version
 
+In the command below, use the install directory printed by Step 2:
+
 ```bash
 OLD_VERSION=$(cat "$INSTALL_DIR/VERSION" 2>/dev/null || echo "unknown")
 ```
 
 ### Step 4: Upgrade
 
+Use the install type and directory detected in Step 2:
+
 **For git installs** (global-git, local-git):
 ```bash
 cd "$INSTALL_DIR"
@@ -125,7 +131,7 @@ rm -rf "$INSTALL_DIR.bak" "$TMP_DIR"
 
 ### Step 4.5: Sync local vendored copy
 
-After upgrading the primary install, check if there's also a local copy in the current project that needs updating:
+Use the install directory from Step 2. Check if there's also a local vendored copy that needs updating:
 
 ```bash
 _ROOT=$(git rev-parse --show-toplevel 2>/dev/null)
diff --git a/gstack-upgrade/SKILL.md.tmpl b/gstack-upgrade/SKILL.md.tmpl
index 4a124be1..a199db6c 100644
--- a/gstack-upgrade/SKILL.md.tmpl
+++ b/gstack-upgrade/SKILL.md.tmpl
@@ -92,14 +92,20 @@ fi
 echo "Install type: $INSTALL_TYPE at $INSTALL_DIR"
 ```
 
+The install type and directory path printed above will be used in all subsequent steps.
+
 ### Step 3: Save old version
 
+In the command below, use the install directory printed by Step 2:
+
 ```bash
 OLD_VERSION=$(cat "$INSTALL_DIR/VERSION" 2>/dev/null || echo "unknown")
 ```
 
 ### Step 4: Upgrade
 
+Use the install type and directory detected in Step 2:
+
 **For git installs** (global-git, local-git):
 ```bash
 cd "$INSTALL_DIR"
@@ -123,7 +129,7 @@ rm -rf "$INSTALL_DIR.bak" "$TMP_DIR"
 
 ### Step 4.5: Sync local vendored copy
 
-After upgrading the primary install, check if there's also a local copy in the current project that needs updating:
+Use the install directory from Step 2. Check if there's also a local vendored copy that needs updating:
 
 ```bash
 _ROOT=$(git rev-parse --show-toplevel 2>/dev/null)
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index c82753a2..77ca6438 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -73,6 +73,25 @@ Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-log
 
 Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
+## Step 0: Detect base branch
+
+Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.
+
+1. Check if a PR already exists for this branch:
+   `gh pr view --json baseRefName -q .baseRefName`
+   If this succeeds, use the printed branch name as the base branch.
+
+2. If no PR exists (command fails), detect the repo's default branch:
+   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+3. If both commands fail, fall back to `main`.
+
+Print the detected base branch name. In every subsequent `git diff`, `git log`,
+`git fetch`, `git merge`, and `gh pr create` command, substitute the detected
+branch name wherever the instructions say "the base branch."
+
+---
+
 # Mega Plan Review Mode
 
 ## Philosophy
@@ -117,7 +136,7 @@ Before doing anything else, run a system audit. This is not the plan review —
 Run the following commands:
 ```
 git log --oneline -30                          # Recent history
-git diff main --stat                           # What's already changed
+git diff <base> --stat                           # What's already changed
 git stash list                                 # Any stashed work
 grep -r "TODO\|FIXME\|HACK\|XXX" --include="*.rb" --include="*.js" -l
 find . -name "*.rb" -newer Gemfile.lock | head -20  # Recently touched files
diff --git a/plan-ceo-review/SKILL.md.tmpl b/plan-ceo-review/SKILL.md.tmpl
index ef14a281..9902fafb 100644
--- a/plan-ceo-review/SKILL.md.tmpl
+++ b/plan-ceo-review/SKILL.md.tmpl
@@ -16,6 +16,8 @@ allowed-tools:
 
 {{PREAMBLE}}
 
+{{BASE_BRANCH_DETECT}}
+
 # Mega Plan Review Mode
 
 ## Philosophy
@@ -60,7 +62,7 @@ Before doing anything else, run a system audit. This is not the plan review —
 Run the following commands:
 ```
 git log --oneline -30                          # Recent history
-git diff main --stat                           # What's already changed
+git diff <base> --stat                           # What's already changed
 git stash list                                 # Any stashed work
 grep -r "TODO\|FIXME\|HACK\|XXX" --include="*.rb" --include="*.js" -l
 find . -name "*.rb" -newer Gemfile.lock | head -20  # Recently touched files
diff --git a/qa/SKILL.md b/qa/SKILL.md
index c11f8a66..5ea4643a 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -77,6 +77,25 @@ Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-log
 
 Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
+## Step 0: Detect base branch
+
+Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.
+
+1. Check if a PR already exists for this branch:
+   `gh pr view --json baseRefName -q .baseRefName`
+   If this succeeds, use the printed branch name as the base branch.
+
+2. If no PR exists (command fails), detect the repo's default branch:
+   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+3. If both commands fail, fall back to `main`.
+
+Print the detected base branch name. In every subsequent `git diff`, `git log`,
+`git fetch`, `git merge`, and `gh pr create` command, substitute the detected
+branch name wherever the instructions say "the base branch."
+
+---
+
 # /qa: Test → Fix → Verify
 
 You are a QA engineer AND a bug-fix engineer. Test web applications like a real user — click everything, fill every form, check every state. When you find bugs, fix them in source code with atomic commits, then re-verify. Produce a structured report with before/after evidence.
@@ -133,8 +152,7 @@ If `NEEDS_SETUP`:
 **Create output directories:**
 
 ```bash
-REPORT_DIR=".gstack/qa-reports"
-mkdir -p "$REPORT_DIR/screenshots"
+mkdir -p .gstack/qa-reports/screenshots
 ```
 
 ---
diff --git a/qa/SKILL.md.tmpl b/qa/SKILL.md.tmpl
index a3e5a9f0..f491999e 100644
--- a/qa/SKILL.md.tmpl
+++ b/qa/SKILL.md.tmpl
@@ -20,6 +20,8 @@ allowed-tools:
 
 {{PREAMBLE}}
 
+{{BASE_BRANCH_DETECT}}
+
 # /qa: Test → Fix → Verify
 
 You are a QA engineer AND a bug-fix engineer. Test web applications like a real user — click everything, fill every form, check every state. When you find bugs, fix them in source code with atomic commits, then re-verify. Produce a structured report with before/after evidence.
@@ -59,8 +61,7 @@ fi
 **Create output directories:**
 
 ```bash
-REPORT_DIR=".gstack/qa-reports"
-mkdir -p "$REPORT_DIR/screenshots"
+mkdir -p .gstack/qa-reports/screenshots
 ```
 
 ---
diff --git a/retro/SKILL.md b/retro/SKILL.md
index 28280c94..ca44f49e 100644
--- a/retro/SKILL.md
+++ b/retro/SKILL.md
@@ -72,6 +72,16 @@ Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-log
 
 Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
+## Detect default branch
+
+Before gathering data, detect the repo's default branch name:
+`gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+If this fails, fall back to `main`. Use the detected name wherever the instructions
+say `<default>` below (for example, `origin/<default>`).
+
+---
+
 # /retro — Weekly Engineering Retrospective
 
 Generates a comprehensive engineering retrospective analyzing commit history, work patterns, and code quality metrics. Team-aware: identifies the user running the command, then analyzes every contributor with per-person praise and growth opportunities. Designed for a senior IC/CTO-level builder using Claude Code as a force multiplier.
@@ -106,7 +116,7 @@ Usage: /retro [window]
 
 First, fetch origin and identify the current user:
 ```bash
-git fetch origin main --quiet
+git fetch origin <default> --quiet
 # Identify who is running the retro
 git config user.name
 git config user.email
@@ -118,28 +128,28 @@ Run ALL of these git commands in parallel (they are independent):
 
 ```bash
 # 1. All commits in window with timestamps, subject, hash, AUTHOR, files changed, insertions, deletions
-git log origin/main --since="<window>" --format="%H|%aN|%ae|%ai|%s" --shortstat
+git log origin/<default> --since="<window>" --format="%H|%aN|%ae|%ai|%s" --shortstat
 
 # 2. Per-commit test vs total LOC breakdown with author
 #    Each commit block starts with COMMIT:<hash>|<author>, followed by numstat lines.
 #    Separate test files (matching test/|spec/|__tests__/) from production files.
-git log origin/main --since="<window>" --format="COMMIT:%H|%aN" --numstat
+git log origin/<default> --since="<window>" --format="COMMIT:%H|%aN" --numstat
 
 # 3. Commit timestamps for session detection and hourly distribution (with author)
 #    Use TZ=America/Los_Angeles for Pacific time conversion
-TZ=America/Los_Angeles git log origin/main --since="<window>" --format="%at|%aN|%ai|%s" | sort -n
+TZ=America/Los_Angeles git log origin/<default> --since="<window>" --format="%at|%aN|%ai|%s" | sort -n
 
 # 4. Files most frequently changed (hotspot analysis)
-git log origin/main --since="<window>" --format="" --name-only | grep -v '^$' | sort | uniq -c | sort -rn
+git log origin/<default> --since="<window>" --format="" --name-only | grep -v '^$' | sort | uniq -c | sort -rn
 
 # 5. PR numbers from commit messages (extract #NNN patterns)
-git log origin/main --since="<window>" --format="%s" | grep -oE '#[0-9]+' | sed 's/^#//' | sort -n | uniq | sed 's/^/#/'
+git log origin/<default> --since="<window>" --format="%s" | grep -oE '#[0-9]+' | sed 's/^#//' | sort -n | uniq | sed 's/^/#/'
 
 # 6. Per-author file hotspots (who touches what)
-git log origin/main --since="<window>" --format="AUTHOR:%aN" --name-only
+git log origin/<default> --since="<window>" --format="AUTHOR:%aN" --name-only
 
 # 7. Per-author commit counts (quick summary)
-git shortlog origin/main --since="<window>" -sn --no-merges
+git shortlog origin/<default> --since="<window>" -sn --no-merges
 
 # 8. Greptile triage history (if available)
 cat ~/.gstack/greptile-history.md 2>/dev/null || true
@@ -298,14 +308,14 @@ If the time window is 14 days or more, split into weekly buckets and show trends
 
 ### Step 11: Streak Tracking
 
-Count consecutive days with at least 1 commit to origin/main, going back from today. Track both team streak and personal streak:
+Count consecutive days with at least 1 commit to origin/<default>, going back from today. Track both team streak and personal streak:
 
 ```bash
 # Team streak: all unique commit dates (Pacific time) — no hard cutoff
-TZ=America/Los_Angeles git log origin/main --format="%ad" --date=format:"%Y-%m-%d" | sort -u
+TZ=America/Los_Angeles git log origin/<default> --format="%ad" --date=format:"%Y-%m-%d" | sort -u
 
 # Personal streak: only the current user's commits
-TZ=America/Los_Angeles git log origin/main --author="<user_name>" --format="%ad" --date=format:"%Y-%m-%d" | sort -u
+TZ=America/Los_Angeles git log origin/<default> --author="<user_name>" --format="%ad" --date=format:"%Y-%m-%d" | sort -u
 ```
 
 Count backward from today — how many consecutive days have at least one commit? This queries the full history so streaks of any length are reported accurately. Display both:
@@ -523,7 +533,7 @@ When the user runs `/retro compare` (or `/retro compare 14d`):
 ## Important Rules
 
 - ALL narrative output goes directly to the user in the conversation. The ONLY file written is the `.context/retros/` JSON snapshot.
-- Use `origin/main` for all git queries (not local main which may be stale)
+- Use `origin/<default>` for all git queries (not the local branch, which may be stale)
 - Convert all timestamps to Pacific time for display (use `TZ=America/Los_Angeles`)
 - If the window has zero commits, say so and suggest a different window
 - Round LOC/hour to nearest 50
diff --git a/retro/SKILL.md.tmpl b/retro/SKILL.md.tmpl
index 07e08885..2f39fb5c 100644
--- a/retro/SKILL.md.tmpl
+++ b/retro/SKILL.md.tmpl
@@ -15,6 +15,16 @@ allowed-tools:
 
 {{PREAMBLE}}
 
+## Detect default branch
+
+Before gathering data, detect the repo's default branch name:
+`gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+If this fails, fall back to `main`. Use the detected name wherever the instructions
+say `<default>` below (for example, `origin/<default>`).
+
+---
+
 # /retro — Weekly Engineering Retrospective
 
 Generates a comprehensive engineering retrospective analyzing commit history, work patterns, and code quality metrics. Team-aware: identifies the user running the command, then analyzes every contributor with per-person praise and growth opportunities. Designed for a senior IC/CTO-level builder using Claude Code as a force multiplier.
@@ -49,7 +59,7 @@ Usage: /retro [window]
 
 First, fetch origin and identify the current user:
 ```bash
-git fetch origin main --quiet
+git fetch origin <default> --quiet
 # Identify who is running the retro
 git config user.name
 git config user.email
@@ -61,28 +71,28 @@ Run ALL of these git commands in parallel (they are independent):
 
 ```bash
 # 1. All commits in window with timestamps, subject, hash, AUTHOR, files changed, insertions, deletions
-git log origin/main --since="<window>" --format="%H|%aN|%ae|%ai|%s" --shortstat
+git log origin/<default> --since="<window>" --format="%H|%aN|%ae|%ai|%s" --shortstat
 
 # 2. Per-commit test vs total LOC breakdown with author
 #    Each commit block starts with COMMIT:<hash>|<author>, followed by numstat lines.
 #    Separate test files (matching test/|spec/|__tests__/) from production files.
-git log origin/main --since="<window>" --format="COMMIT:%H|%aN" --numstat
+git log origin/<default> --since="<window>" --format="COMMIT:%H|%aN" --numstat
 
 # 3. Commit timestamps for session detection and hourly distribution (with author)
 #    Use TZ=America/Los_Angeles for Pacific time conversion
-TZ=America/Los_Angeles git log origin/main --since="<window>" --format="%at|%aN|%ai|%s" | sort -n
+TZ=America/Los_Angeles git log origin/<default> --since="<window>" --format="%at|%aN|%ai|%s" | sort -n
 
 # 4. Files most frequently changed (hotspot analysis)
-git log origin/main --since="<window>" --format="" --name-only | grep -v '^$' | sort | uniq -c | sort -rn
+git log origin/<default> --since="<window>" --format="" --name-only | grep -v '^$' | sort | uniq -c | sort -rn
 
 # 5. PR numbers from commit messages (extract #NNN patterns)
-git log origin/main --since="<window>" --format="%s" | grep -oE '#[0-9]+' | sed 's/^#//' | sort -n | uniq | sed 's/^/#/'
+git log origin/<default> --since="<window>" --format="%s" | grep -oE '#[0-9]+' | sed 's/^#//' | sort -n | uniq | sed 's/^/#/'
 
 # 6. Per-author file hotspots (who touches what)
-git log origin/main --since="<window>" --format="AUTHOR:%aN" --name-only
+git log origin/<default> --since="<window>" --format="AUTHOR:%aN" --name-only
 
 # 7. Per-author commit counts (quick summary)
-git shortlog origin/main --since="<window>" -sn --no-merges
+git shortlog origin/<default> --since="<window>" -sn --no-merges
 
 # 8. Greptile triage history (if available)
 cat ~/.gstack/greptile-history.md 2>/dev/null || true
@@ -241,14 +251,14 @@ If the time window is 14 days or more, split into weekly buckets and show trends
 
 ### Step 11: Streak Tracking
 
-Count consecutive days with at least 1 commit to origin/main, going back from today. Track both team streak and personal streak:
+Count consecutive days with at least 1 commit to origin/<default>, going back from today. Track both team streak and personal streak:
 
 ```bash
 # Team streak: all unique commit dates (Pacific time) — no hard cutoff
-TZ=America/Los_Angeles git log origin/main --format="%ad" --date=format:"%Y-%m-%d" | sort -u
+TZ=America/Los_Angeles git log origin/<default> --format="%ad" --date=format:"%Y-%m-%d" | sort -u
 
 # Personal streak: only the current user's commits
-TZ=America/Los_Angeles git log origin/main --author="<user_name>" --format="%ad" --date=format:"%Y-%m-%d" | sort -u
+TZ=America/Los_Angeles git log origin/<default> --author="<user_name>" --format="%ad" --date=format:"%Y-%m-%d" | sort -u
 ```
 
 Count backward from today — how many consecutive days have at least one commit? This queries the full history so streaks of any length are reported accurately. Display both:
@@ -466,7 +476,7 @@ When the user runs `/retro compare` (or `/retro compare 14d`):
 ## Important Rules
 
 - ALL narrative output goes directly to the user in the conversation. The ONLY file written is the `.context/retros/` JSON snapshot.
-- Use `origin/main` for all git queries (not local main which may be stale)
+- Use `origin/<default>` for all git queries (not the local branch, which may be stale)
 - Convert all timestamps to Pacific time for display (use `TZ=America/Los_Angeles`)
 - If the window has zero commits, say so and suggest a different window
 - Round LOC/hour to nearest 50
diff --git a/review/SKILL.md b/review/SKILL.md
index 32c597a3..949a0c65 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -2,7 +2,7 @@
 name: review
 version: 1.0.0
 description: |
-  Pre-landing PR review. Analyzes diff against main for SQL safety, LLM trust
+  Pre-landing PR review. Analyzes diff against the base branch for SQL safety, LLM trust
   boundary violations, conditional side effects, and other structural issues.
 allowed-tools:
   - Bash
@@ -73,17 +73,36 @@ Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-log
 
 Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
+## Step 0: Detect base branch
+
+Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.
+
+1. Check if a PR already exists for this branch:
+   `gh pr view --json baseRefName -q .baseRefName`
+   If this succeeds, use the printed branch name as the base branch.
+
+2. If no PR exists (command fails), detect the repo's default branch:
+   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+3. If both commands fail, fall back to `main`.
+
+Print the detected base branch name. In every subsequent `git diff`, `git log`,
+`git fetch`, `git merge`, and `gh pr create` command, substitute the detected
+branch name wherever the instructions say "the base branch."
+
+---
+
 # Pre-Landing PR Review
 
-You are running the `/review` workflow. Analyze the current branch's diff against main for structural issues that tests don't catch.
+You are running the `/review` workflow. Analyze the current branch's diff against the base branch for structural issues that tests don't catch.
 
 ---
 
 ## Step 1: Check branch
 
 1. Run `git branch --show-current` to get the current branch.
-2. If on `main`, output: **"Nothing to review — you're on main or have no changes against main."** and stop.
-3. Run `git fetch origin main --quiet && git diff origin/main --stat` to check if there's a diff. If no diff, output the same message and stop.
+2. If on the base branch, output: **"Nothing to review — you're on the base branch or have no changes against it."** and stop.
+3. Run `git fetch origin <base> --quiet && git diff origin/<base> --stat` to check if there's a diff. If no diff, output the same message and stop.
 
 ---
 
@@ -107,13 +126,13 @@ Read `.claude/skills/review/greptile-triage.md` and follow the fetch, filter, cl
 
 ## Step 3: Get the diff
 
-Fetch the latest main to avoid false positives from a stale local main:
+Fetch the latest base branch to avoid false positives from stale local state:
 
 ```bash
-git fetch origin main --quiet
+git fetch origin <base> --quiet
 ```
 
-Run `git diff origin/main` to get the full diff. This includes both committed and uncommitted changes against the latest main.
+Run `git diff origin/<base>` to get the full diff. This includes both committed and uncommitted changes against the latest base branch.
 
 ---
 
diff --git a/review/SKILL.md.tmpl b/review/SKILL.md.tmpl
index 124a5393..dadd211a 100644
--- a/review/SKILL.md.tmpl
+++ b/review/SKILL.md.tmpl
@@ -2,7 +2,7 @@
 name: review
 version: 1.0.0
 description: |
-  Pre-landing PR review. Analyzes diff against main for SQL safety, LLM trust
+  Pre-landing PR review. Analyzes diff against the base branch for SQL safety, LLM trust
   boundary violations, conditional side effects, and other structural issues.
 allowed-tools:
   - Bash
@@ -16,17 +16,19 @@ allowed-tools:
 
 {{PREAMBLE}}
 
+{{BASE_BRANCH_DETECT}}
+
 # Pre-Landing PR Review
 
-You are running the `/review` workflow. Analyze the current branch's diff against main for structural issues that tests don't catch.
+You are running the `/review` workflow. Analyze the current branch's diff against the base branch for structural issues that tests don't catch.
 
 ---
 
 ## Step 1: Check branch
 
 1. Run `git branch --show-current` to get the current branch.
-2. If on `main`, output: **"Nothing to review — you're on main or have no changes against main."** and stop.
-3. Run `git fetch origin main --quiet && git diff origin/main --stat` to check if there's a diff. If no diff, output the same message and stop.
+2. If on the base branch, output: **"Nothing to review — you're on the base branch or have no changes against it."** and stop.
+3. Run `git fetch origin <base> --quiet && git diff origin/<base> --stat` to check if there's a diff. If no diff, output the same message and stop.
 
 ---
 
@@ -50,13 +52,13 @@ Read `.claude/skills/review/greptile-triage.md` and follow the fetch, filter, cl
 
 ## Step 3: Get the diff
 
-Fetch the latest main to avoid false positives from a stale local main:
+Fetch the latest base branch to avoid false positives from stale local state:
 
 ```bash
-git fetch origin main --quiet
+git fetch origin <base> --quiet
 ```
 
-Run `git diff origin/main` to get the full diff. This includes both committed and uncommitted changes against the latest main.
+Run `git diff origin/<base>` to get the full diff. This includes both committed and uncommitted changes against the latest base branch.
 
 ---
 
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index bafed642..9c81e968 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -174,6 +174,27 @@ If \`NEEDS_SETUP\`:
 3. If \`bun\` is not installed: \`curl -fsSL https://bun.sh/install | bash\``;
 }
 
+function generateBaseBranchDetect(): string {
+  // Three-tier detection: existing PR base, then repo default, then `main`.
+  const detectionSteps = [
+    '1. Check if a PR already exists for this branch:\n' +
+      '   `gh pr view --json baseRefName -q .baseRefName`\n' +
+      '   If this succeeds, use the printed branch name as the base branch.',
+    "2. If no PR exists (command fails), detect the repo's default branch:\n" +
+      '   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`',
+    '3. If both commands fail, fall back to `main`.',
+  ];
+  return [
+    '## Step 0: Detect base branch',
+    'Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.',
+    ...detectionSteps,
+    'Print the detected base branch name. In every subsequent `git diff`, `git log`,\n' +
+      '`git fetch`, `git merge`, and `gh pr create` command, substitute the detected\n' +
+      'branch name wherever the instructions say "the base branch."',
+    '---',
+  ].join('\n\n'); // sections are separated by exactly one blank line
+}
+
 function generateQAMethodology(): string {
   return `## Modes
 
@@ -455,6 +476,7 @@ const RESOLVERS: Record<string, () => string> = {
   SNAPSHOT_FLAGS: generateSnapshotFlags,
   PREAMBLE: generatePreamble,
   BROWSE_SETUP: generateBrowseSetup,
+  BASE_BRANCH_DETECT: generateBaseBranchDetect,
   QA_METHODOLOGY: generateQAMethodology,
 };
 
diff --git a/ship/SKILL.md b/ship/SKILL.md
index e023816d..47a9da11 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -2,7 +2,7 @@
 name: ship
 version: 1.0.0
 description: |
-  Ship workflow: merge main, run tests, review diff, bump VERSION, update CHANGELOG, commit, push, create PR.
+  Ship workflow: detect + merge base branch, run tests, review diff, bump VERSION, update CHANGELOG, commit, push, create PR.
 allowed-tools:
   - Bash
   - Read
@@ -72,12 +72,31 @@ Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-log
 
 Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
+## Step 0: Detect base branch
+
+Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.
+
+1. Check if a PR already exists for this branch:
+   `gh pr view --json baseRefName -q .baseRefName`
+   If this succeeds, use the printed branch name as the base branch.
+
+2. If no PR exists (command fails), detect the repo's default branch:
+   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+3. If both commands fail, fall back to `main`.
+
+Print the detected base branch name. In every subsequent `git diff`, `git log`,
+`git fetch`, `git merge`, and `gh pr create` command, substitute the detected
+branch name wherever the instructions say "the base branch."
+
+---
+
 # Ship: Fully Automated Ship Workflow
 
 You are running the `/ship` workflow. This is a **non-interactive, fully automated** workflow. Do NOT ask for confirmation at any step. The user said `/ship` which means DO IT. Run straight through and output the PR URL at the end.
 
 **Only stop for:**
-- On `main` branch (abort)
+- On the base branch (abort)
 - Merge conflicts that can't be auto-resolved (stop, show conflicts)
 - Test failures (stop, show failures)
 - Pre-landing review finds CRITICAL issues and user chooses to fix (not acknowledge or skip)
@@ -98,20 +117,20 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 ## Step 1: Pre-flight
 
-1. Check the current branch. If on `main`, **abort**: "You're on main. Ship from a feature branch."
+1. Check the current branch. If on the base branch or the repo's default branch, **abort**: "You're on the base branch. Ship from a feature branch."
 
 2. Run `git status` (never use `-uall`). Uncommitted changes are always included — no need to ask.
 
-3. Run `git diff main...HEAD --stat` and `git log main..HEAD --oneline` to understand what's being shipped.
+3. Run `git diff <base>...HEAD --stat` and `git log <base>..HEAD --oneline` to understand what's being shipped.
 
 ---
 
-## Step 2: Merge origin/main (BEFORE tests)
+## Step 2: Merge the base branch (BEFORE tests)
 
-Fetch and merge `origin/main` into the feature branch so tests run against the merged state:
+Fetch and merge the base branch into the feature branch so tests run against the merged state:
 
 ```bash
-git fetch origin main && git merge origin/main --no-edit
+git fetch origin <base> && git merge origin/<base> --no-edit
 ```
 
 **If there are merge conflicts:** Try to auto-resolve if they are simple (VERSION, schema.rb, CHANGELOG ordering). If conflicts are complex or ambiguous, **STOP** and show them.
@@ -149,7 +168,7 @@ Evals are mandatory when prompt-related files change. Skip this step entirely if
 **1. Check if the diff touches prompt-related files:**
 
 ```bash
-git diff origin/main --name-only
+git diff origin/<base> --name-only
 ```
 
 Match against these patterns (from CLAUDE.md):
@@ -210,7 +229,7 @@ Review the diff for structural issues that tests don't catch.
 
 1. Read `.claude/skills/review/checklist.md`. If the file cannot be read, **STOP** and report the error.
 
-2. Run `git diff origin/main` to get the full diff (scoped to feature changes against the freshly-fetched remote main).
+2. Run `git diff origin/<base>` to get the full diff (scoped to feature changes against the freshly-fetched base branch).
 
 3. Apply the review checklist in two passes:
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
@@ -278,7 +297,7 @@ For each classified comment:
 1. Read the current `VERSION` file (4-digit format: `MAJOR.MINOR.PATCH.MICRO`)
 
 2. **Auto-decide the bump level based on the diff:**
-   - Count lines changed (`git diff origin/main...HEAD --stat | tail -1`)
+   - Count lines changed (`git diff origin/<base>...HEAD --stat | tail -1`)
    - **MICRO** (4th digit): < 50 lines changed, trivial tweaks, typos, config
    - **PATCH** (3rd digit): 50+ lines changed, bug fixes, small-medium features
    - **MINOR** (2nd digit): **ASK the user** — only for major features or significant architectural changes
@@ -297,8 +316,8 @@ For each classified comment:
 1. Read `CHANGELOG.md` header to know the format.
 
 2. Auto-generate the entry from **ALL commits on the branch** (not just recent ones):
-   - Use `git log main..HEAD --oneline` to see every commit being shipped
-   - Use `git diff main...HEAD` to see the full diff against main
+   - Use `git log <base>..HEAD --oneline` to see every commit being shipped
+   - Use `git diff <base>...HEAD` to see the full diff against the base branch
    - The CHANGELOG entry must be comprehensive of ALL changes going into the PR
    - If existing CHANGELOG entries on the branch already cover some commits, replace them with one unified entry for the new version
    - Categorize changes into applicable sections:
@@ -346,8 +365,8 @@ Read TODOS.md and verify it follows the recommended structure:
 This step is fully automatic — no user interaction.
 
 Use the diff and commit history already gathered in earlier steps:
-- `git diff main...HEAD` (full diff against main)
-- `git log main..HEAD --oneline` (all commits being shipped)
+- `git diff <base>...HEAD` (full diff against the base branch)
+- `git log <base>..HEAD --oneline` (all commits being shipped)
 
 For each TODO item, check if the changes in this PR complete it by:
 - Matching commit messages against the TODO title and description
@@ -422,7 +441,7 @@ git push -u origin <branch-name>
 Create a pull request using `gh`:
 
 ```bash
-gh pr create --title "<type>: <summary>" --body "$(cat <<'EOF'
+gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 ## Summary
 <bullet points from CHANGELOG>
 
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index 06ff5a07..ae5df404 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -2,7 +2,7 @@
 name: ship
 version: 1.0.0
 description: |
-  Ship workflow: merge main, run tests, review diff, bump VERSION, update CHANGELOG, commit, push, create PR.
+  Ship workflow: detect + merge base branch, run tests, review diff, bump VERSION, update CHANGELOG, commit, push, create PR.
 allowed-tools:
   - Bash
   - Read
@@ -15,12 +15,14 @@ allowed-tools:
 
 {{PREAMBLE}}
 
+{{BASE_BRANCH_DETECT}}
+
 # Ship: Fully Automated Ship Workflow
 
 You are running the `/ship` workflow. This is a **non-interactive, fully automated** workflow. Do NOT ask for confirmation at any step. The user said `/ship` which means DO IT. Run straight through and output the PR URL at the end.
 
 **Only stop for:**
-- On `main` branch (abort)
+- On the base branch (abort)
 - Merge conflicts that can't be auto-resolved (stop, show conflicts)
 - Test failures (stop, show failures)
 - Pre-landing review finds CRITICAL issues and user chooses to fix (not acknowledge or skip)
@@ -41,20 +43,20 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 ## Step 1: Pre-flight
 
-1. Check the current branch. If on `main`, **abort**: "You're on main. Ship from a feature branch."
+1. Check the current branch. If on the base branch or the repo's default branch, **abort**: "You're on the base branch. Ship from a feature branch."
 
 2. Run `git status` (never use `-uall`). Uncommitted changes are always included — no need to ask.
 
-3. Run `git diff main...HEAD --stat` and `git log main..HEAD --oneline` to understand what's being shipped.
+3. Run `git diff <base>...HEAD --stat` and `git log <base>..HEAD --oneline` to understand what's being shipped.
 
 ---
 
-## Step 2: Merge origin/main (BEFORE tests)
+## Step 2: Merge the base branch (BEFORE tests)
 
-Fetch and merge `origin/main` into the feature branch so tests run against the merged state:
+Fetch and merge the base branch into the feature branch so tests run against the merged state:
 
 ```bash
-git fetch origin main && git merge origin/main --no-edit
+git fetch origin <base> && git merge origin/<base> --no-edit
 ```
 
 **If there are merge conflicts:** Try to auto-resolve if they are simple (VERSION, schema.rb, CHANGELOG ordering). If conflicts are complex or ambiguous, **STOP** and show them.
@@ -92,7 +94,7 @@ Evals are mandatory when prompt-related files change. Skip this step entirely if
 **1. Check if the diff touches prompt-related files:**
 
 ```bash
-git diff origin/main --name-only
+git diff origin/<base> --name-only
 ```
 
 Match against these patterns (from CLAUDE.md):
@@ -153,7 +155,7 @@ Review the diff for structural issues that tests don't catch.
 
 1. Read `.claude/skills/review/checklist.md`. If the file cannot be read, **STOP** and report the error.
 
-2. Run `git diff origin/main` to get the full diff (scoped to feature changes against the freshly-fetched remote main).
+2. Run `git diff origin/<base>` to get the full diff (scoped to feature changes against the freshly-fetched base branch).
 
 3. Apply the review checklist in two passes:
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
@@ -221,7 +223,7 @@ For each classified comment:
 1. Read the current `VERSION` file (4-digit format: `MAJOR.MINOR.PATCH.MICRO`)
 
 2. **Auto-decide the bump level based on the diff:**
-   - Count lines changed (`git diff origin/main...HEAD --stat | tail -1`)
+   - Count lines changed (`git diff origin/<base>...HEAD --stat | tail -1`)
    - **MICRO** (4th digit): < 50 lines changed, trivial tweaks, typos, config
    - **PATCH** (3rd digit): 50+ lines changed, bug fixes, small-medium features
    - **MINOR** (2nd digit): **ASK the user** — only for major features or significant architectural changes
@@ -240,8 +242,8 @@ For each classified comment:
 1. Read `CHANGELOG.md` header to know the format.
 
 2. Auto-generate the entry from **ALL commits on the branch** (not just recent ones):
-   - Use `git log main..HEAD --oneline` to see every commit being shipped
-   - Use `git diff main...HEAD` to see the full diff against main
+   - Use `git log <base>..HEAD --oneline` to see every commit being shipped
+   - Use `git diff <base>...HEAD` to see the full diff against the base branch
    - The CHANGELOG entry must be comprehensive of ALL changes going into the PR
    - If existing CHANGELOG entries on the branch already cover some commits, replace them with one unified entry for the new version
    - Categorize changes into applicable sections:
@@ -289,8 +291,8 @@ Read TODOS.md and verify it follows the recommended structure:
 This step is fully automatic — no user interaction.
 
 Use the diff and commit history already gathered in earlier steps:
-- `git diff main...HEAD` (full diff against main)
-- `git log main..HEAD --oneline` (all commits being shipped)
+- `git diff <base>...HEAD` (full diff against the base branch)
+- `git log <base>..HEAD --oneline` (all commits being shipped)
 
 For each TODO item, check if the changes in this PR complete it by:
 - Matching commit messages against the TODO title and description
@@ -365,7 +367,7 @@ git push -u origin <branch-name>
 Create a pull request using `gh`:
 
 ```bash
-gh pr create --title "<type>: <summary>" --body "$(cat <<'EOF'
+gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 ## Summary
 <bullet points from CHANGELOG>
 
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index a2499af6..e77989f0 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -203,6 +203,27 @@ describe('gen-skill-docs', () => {
   });
 });
 
+describe('BASE_BRANCH_DETECT resolver', () => {
+  // ship/SKILL.md is generated from a template that uses the placeholder,
+  // so its text reflects what the resolver emitted.
+  const generatedShipSkill = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+  test('resolver output contains PR base detection command', () => {
+    expect(generatedShipSkill).toContain('gh pr view --json baseRefName');
+  });
+
+  test('resolver output contains repo default branch detection command', () => {
+    expect(generatedShipSkill).toContain('gh repo view --json defaultBranchRef');
+  });
+
+  test('resolver output contains fallback to main', () => {
+    expect(generatedShipSkill).toMatch(/fall\s*back\s+to\s+`main`/i);
+  });
+
+  test('resolver output uses "the base branch" phrasing', () => {
+    expect(generatedShipSkill).toContain('the base branch');
+  });
+});
+
 /**
  * Quality evals — catch description regressions.
  *
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 8ce1f40f..4978ce53 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1344,6 +1344,193 @@ Write your review to ${planDir}/review-output.md`,
   }, 420_000);
 });
 
+// --- Base branch detection smoke tests ---
+
+describeE2E('Base branch detection', () => {
+  let baseBranchDir: string;
+  const run = (cmd: string, args: string[], cwd: string) =>
+    spawnSync(cmd, args, { cwd, stdio: 'pipe', timeout: 5000 });
+
+  beforeAll(() => {
+    baseBranchDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-basebranch-'));
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(baseBranchDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/review detects base branch and diffs against it', async () => {
+    const dir = path.join(baseBranchDir, 'review-base');
+    fs.mkdirSync(dir, { recursive: true });
+
+    // Create git repo with a feature branch off main (-b pins the name regardless of init.defaultBranch)
+    run('git', ['init', '-b', 'main'], dir);
+    run('git', ['config', 'user.email', 'test@test.com'], dir);
+    run('git', ['config', 'user.name', 'Test'], dir);
+
+    fs.writeFileSync(path.join(dir, 'app.rb'), '# clean base\nclass App\nend\n');
+    run('git', ['add', 'app.rb'], dir);
+    run('git', ['commit', '-m', 'initial commit'], dir);
+
+    // Create feature branch with a change
+    run('git', ['checkout', '-b', 'feature/test-review'], dir);
+    fs.writeFileSync(path.join(dir, 'app.rb'), '# clean base\nclass App\n  def hello; "world"; end\nend\n');
+    run('git', ['add', 'app.rb'], dir);
+    run('git', ['commit', '-m', 'feat: add hello method'], dir);
+
+    // Copy review skill files
+    fs.copyFileSync(path.join(ROOT, 'review', 'SKILL.md'), path.join(dir, 'review-SKILL.md'));
+    fs.copyFileSync(path.join(ROOT, 'review', 'checklist.md'), path.join(dir, 'review-checklist.md'));
+    fs.copyFileSync(path.join(ROOT, 'review', 'greptile-triage.md'), path.join(dir, 'review-greptile-triage.md'));
+
+    const result = await runSkillTest({
+      prompt: `You are in a git repo on a feature branch with changes.
+Read review-SKILL.md for the review workflow instructions.
+Also read review-checklist.md and apply it.
+
+IMPORTANT: Follow Step 0 to detect the base branch. Since there is no remote, gh commands will fail — fall back to main.
+Then run the review against the detected base branch.
+Write your findings to ${dir}/review-output.md`,
+      workingDirectory: dir,
+      maxTurns: 15,
+      timeout: 90_000,
+      testName: 'review-base-branch',
+      runId,
+    });
+
+    logCost('/review base-branch', result);
+    recordE2E('/review base branch detection', 'Base branch detection', result);
+    expect(result.exitReason).toBe('success');
+
+    // The agent should have run git diff against main (the fallback).
+    // NOTE(review): tool input may be a structured object rather than a raw
+    // string — serialize it so the command text is searchable either way.
+    const usedGitDiff = result.toolCalls.some(tc =>
+      tc.tool === 'Bash' &&
+      (typeof tc.input === 'string' ? tc.input : JSON.stringify(tc.input ?? '')).includes('git diff')
+    );
+    expect(usedGitDiff).toBe(true);
+  }, 120_000);
+
+  test('/ship Step 0-1 detects base branch without destructive actions', async () => {
+    const dir = path.join(baseBranchDir, 'ship-base');
+    fs.mkdirSync(dir, { recursive: true });
+
+    // Create git repo with feature branch (-b pins the base to main regardless of init.defaultBranch)
+    run('git', ['init', '-b', 'main'], dir);
+    run('git', ['config', 'user.email', 'test@test.com'], dir);
+    run('git', ['config', 'user.name', 'Test'], dir);
+
+    fs.writeFileSync(path.join(dir, 'app.ts'), 'console.log("v1");\n');
+    run('git', ['add', 'app.ts'], dir);
+    run('git', ['commit', '-m', 'initial'], dir);
+
+    run('git', ['checkout', '-b', 'feature/ship-test'], dir);
+    fs.writeFileSync(path.join(dir, 'app.ts'), 'console.log("v2");\n');
+    run('git', ['add', 'app.ts'], dir);
+    run('git', ['commit', '-m', 'feat: update to v2'], dir);
+
+    // Copy ship skill
+    fs.copyFileSync(path.join(ROOT, 'ship', 'SKILL.md'), path.join(dir, 'ship-SKILL.md'));
+
+    const result = await runSkillTest({
+      prompt: `Read ship-SKILL.md for the ship workflow.
+
+Run ONLY Step 0 (Detect base branch) and Step 1 (Pre-flight) from the ship workflow.
+Since there is no remote, gh commands will fail — fall back to main.
+
+After completing Step 0 and Step 1, STOP. Do NOT proceed to Step 2 or beyond.
+Do NOT push, create PRs, or modify VERSION/CHANGELOG.
+
+Write a summary of what you detected to ${dir}/ship-preflight.md including:
+- The detected base branch name
+- The current branch name
+- The diff stat against the base branch`,
+      workingDirectory: dir,
+      maxTurns: 10,
+      timeout: 60_000,
+      testName: 'ship-base-branch',
+      runId,
+    });
+
+    logCost('/ship base-branch', result);
+    recordE2E('/ship base branch detection', 'Base branch detection', result);
+    expect(result.exitReason).toBe('success');
+
+    // Verify preflight output was written
+    const preflightPath = path.join(dir, 'ship-preflight.md');
+    if (fs.existsSync(preflightPath)) {
+      const content = fs.readFileSync(preflightPath, 'utf-8');
+      expect(content.length).toBeGreaterThan(20);
+      // Should mention the branch name
+      expect(content.toLowerCase()).toMatch(/main|base/);
+    }
+
+    // Verify no destructive actions — no push, no PR creation (input may be a string or a structured object)
+    const destructiveTools = result.toolCalls.filter(tc => {
+      const cmd = typeof tc.input === 'string' ? tc.input : JSON.stringify(tc.input ?? '');
+      return tc.tool === 'Bash' && (cmd.includes('git push') || cmd.includes('gh pr create'));
+    });
+    expect(destructiveTools).toHaveLength(0);
+  }, 90_000);
+
+  test('/retro detects default branch for git queries', async () => {
+    const dir = path.join(baseBranchDir, 'retro-base');
+    fs.mkdirSync(dir, { recursive: true });
+
+    // Create git repo with commit history on main (-b pins the name; the prompt below refers to local main)
+    run('git', ['init', '-b', 'main'], dir);
+    run('git', ['config', 'user.email', 'dev@example.com'], dir);
+    run('git', ['config', 'user.name', 'Dev'], dir);
+
+    fs.writeFileSync(path.join(dir, 'app.ts'), 'console.log("hello");\n');
+    run('git', ['add', 'app.ts'], dir);
+    run('git', ['commit', '-m', 'feat: initial app', '--date', '2026-03-14T09:00:00'], dir);
+
+    fs.writeFileSync(path.join(dir, 'auth.ts'), 'export function login() {}\n');
+    run('git', ['add', 'auth.ts'], dir);
+    run('git', ['commit', '-m', 'feat: add auth', '--date', '2026-03-15T10:00:00'], dir);
+
+    fs.writeFileSync(path.join(dir, 'test.ts'), 'test("it works", () => {});\n');
+    run('git', ['add', 'test.ts'], dir);
+    run('git', ['commit', '-m', 'test: add tests', '--date', '2026-03-16T11:00:00'], dir);
+
+    // Copy retro skill
+    fs.mkdirSync(path.join(dir, 'retro'), { recursive: true });
+    fs.copyFileSync(path.join(ROOT, 'retro', 'SKILL.md'), path.join(dir, 'retro', 'SKILL.md'));
+
+    const result = await runSkillTest({
+      prompt: `Read retro/SKILL.md for instructions on how to run a retrospective.
+
+IMPORTANT: Follow the "Detect default branch" step first. Since there is no remote, gh will fail — fall back to main.
+Then use the detected branch name for all git queries.
+
+Run /retro for the last 7 days of this git repo. Skip any AskUserQuestion calls — this is non-interactive.
+This is a local-only repo so use the local branch (main) instead of origin/main for all git log commands.
+
+Write your retrospective to ${dir}/retro-output.md`,
+      workingDirectory: dir,
+      maxTurns: 25,
+      timeout: 240_000,
+      testName: 'retro-base-branch',
+      runId,
+    });
+
+    logCost('/retro base-branch', result);
+    recordE2E('/retro default branch detection', 'Base branch detection', result, {
+      passed: ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+
+    // Verify retro output was produced (checked only when the agent got far enough to write it)
+    const retroPath = path.join(dir, 'retro-output.md');
+    if (fs.existsSync(retroPath)) {
+      const content = fs.readFileSync(retroPath, 'utf-8');
+      expect(content.length).toBeGreaterThan(100);
+    }
+  }, 300_000);
+});
+
 // --- Deferred skill E2E tests (destructive or require interactive UI) ---
 
 describeE2E('Deferred skill E2E', () => {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 88e98935..2a947b15 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -388,6 +388,64 @@ describe('Greptile history format consistency', () => {
   });
 });
 
+// --- Hardcoded branch name detection in templates ---
+
+describe('No hardcoded branch names in SKILL templates', () => {
+  const tmplFiles = [
+    'ship/SKILL.md.tmpl',
+    'review/SKILL.md.tmpl',
+    'qa/SKILL.md.tmpl',
+    'plan-ceo-review/SKILL.md.tmpl',
+    'retro/SKILL.md.tmpl',
+  ];
+
+  // Patterns that indicate hardcoded 'main' in git commands
+  const gitMainPatterns = [
+    /\bgit\s+diff\s+(?:origin\/)?main\b/,
+    /\bgit\s+log\s+(?:origin\/)?main\b/,
+    /\bgit\s+fetch\s+origin\s+main\b/,
+    /\bgit\s+merge\s+origin\/main\b/,
+    /\borigin\/main\b/,
+  ];
+
+  // Lines that are allowed to mention 'main' (fallback logic, prose).
+  // Backticks are optional in each pattern, so one entry covers both spellings;
+  // the legacy "If on `main`" wording is deliberately NOT exempted.
+  const allowlist = [
+    /fall\s*back\s+to\s+`?main`?/i,
+    /typically\s+`?main`?/i,
+  ];
+
+  for (const tmplFile of tmplFiles) {
+    test(`${tmplFile} has no hardcoded 'main' in git commands`, () => {
+      const filePath = path.join(ROOT, tmplFile);
+      if (!fs.existsSync(filePath)) return;
+      const lines = fs.readFileSync(filePath, 'utf-8').split('\n');
+      const violations: string[] = [];
+
+      for (let i = 0; i < lines.length; i++) {
+        const line = lines[i];
+        const isAllowlisted = allowlist.some(p => p.test(line));
+        if (isAllowlisted) continue;
+
+        for (const pattern of gitMainPatterns) {
+          if (pattern.test(line)) {
+            violations.push(`Line ${i + 1}: ${line.trim()}`);
+            break;
+          }
+        }
+      }
+
+      if (violations.length > 0) {
+        throw new Error(
+          `${tmplFile} has hardcoded 'main' in git commands:\n` +
+          violations.map(v => `  ${v}`).join('\n')
+        );
+      }
+    });
+  }
+});
+
 // --- Part 7b: TODOS-format.md reference consistency ---
 
 describe('TODOS-format.md reference consistency', () => {

From 78e519e3b763680ba483aa606d7e2cfbadb1952f Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 11:28:58 -0500
Subject: [PATCH 02/22] feat: await support in browse js/eval + contributor
 mode v2 (#104)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: support await in $B js and eval commands

Auto-wrap await expressions in async IIFE context so
$B js "await fetch(...)" works without SyntaxError.

- hasAwait() strips comments before detection
- js: expression wrapping (async()=>(expr))()
- eval: smart wrapping — single-line=expression, multi-line=block
- 6 new unit tests covering async, false-positive, and return semantics

* feat: redesign contributor mode — periodic reflection with 0-10 rating

Replace passive "report when things break" with active reflection:
- Rate gstack experience 0-10 at workflow step boundaries
- Historical calibration example (await bug) anchors the reporting bar
- "What would make this a 10" field focuses on actionable improvements
- Removed category lists in favor of judgment-based assessment

* test: add deterministic contributor mode preamble validation

40 new skill-validation tests (4 checks × 10 skills) verify:
- 0-10 rating scale present
- Calibration example present
- "What would make this a 10" field present
- Periodic reflection (not per-command)

Update existing E2E contributor eval for new report format.

* chore: bump version and changelog (v0.4.2)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: improve contributor mode + qa-quick E2E reliability

Contributor mode:
- Add "do not truncate" directive to template — agent was stopping
  after "My rating" without completing Steps/Raw output/What would
  make this a 10 sections
- Restore assertions for Steps to reproduce and Date footer

QA quick:
- Make test server URL prominent: top of prompt, explicit "already
  running" and "do NOT discover ports" instructions
- Bump session timeout 180s→240s and test timeout 240s→300s
- Set B= at top of prompt (was buried in prose)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: use flexible assertions for contributor mode E2E

Agent writes thorough reports with creative section names
("Repro Steps" vs "Steps to reproduce"). Match intent not formatting:
- /repro|steps to reproduce/ for reproduction steps
- /date.*2026/ for date footer presence

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* docs: add E2E eval failure blame protocol

"Not related to our changes" is an extraordinary claim that requires
extraordinary proof. When evals fail during /ship:

1. Run the same eval on main — prove it fails there too
2. If it passes on main, it IS your change — trace the blame
3. If you can't verify, say "unverified" not "pre-existing"

Added to CLAUDE.md and as a comment in skill-e2e.test.ts.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* docs: update CONTRIBUTING.md and BROWSER.md for v0.4.2

CONTRIBUTING.md: update contributor mode description — now describes
periodic 0-10 reflection loop instead of passive friction detection.

BROWSER.md: add js/eval async documentation — await expressions are
auto-wrapped in async context, single-line eval returns values directly.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: restore v0.4.2 changelog entries lost during cherry-pick conflict

The base branch detection entries from main were dropped when resolving
the CHANGELOG conflict — should have merged both sets, not replaced.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 BROWSER.md                     | 12 ++++++++
 CHANGELOG.md                   |  6 ++++
 CLAUDE.md                      | 15 ++++++++++
 CONTRIBUTING.md                | 10 ++++---
 SKILL.md                       | 24 +++++++++------
 browse/SKILL.md                | 24 +++++++++------
 browse/src/read-commands.ts    | 16 +++++++++-
 browse/test/commands.test.ts   | 54 ++++++++++++++++++++++++++++++++++
 plan-ceo-review/SKILL.md       | 24 +++++++++------
 plan-eng-review/SKILL.md       | 24 +++++++++------
 qa-only/SKILL.md               | 24 +++++++++------
 qa/SKILL.md                    | 24 +++++++++------
 retro/SKILL.md                 | 24 +++++++++------
 review/SKILL.md                | 24 +++++++++------
 scripts/gen-skill-docs.ts      | 24 +++++++++------
 setup-browser-cookies/SKILL.md | 24 +++++++++------
 ship/SKILL.md                  | 24 +++++++++------
 test/skill-e2e.test.ts         | 21 +++++++++++--
 test/skill-validation.test.ts  | 38 ++++++++++++++++++++++++
 19 files changed, 329 insertions(+), 107 deletions(-)

diff --git a/BROWSER.md b/BROWSER.md
index 2d828ebe..df4a6d1d 100644
--- a/BROWSER.md
+++ b/BROWSER.md
@@ -127,6 +127,18 @@ The `console`, `network`, and `dialog` commands read from the in-memory buffers,
 
 Dialogs (alert, confirm, prompt) are auto-accepted by default to prevent browser lockup. The `dialog-accept` and `dialog-dismiss` commands control this behavior. For prompts, `dialog-accept <text>` provides the response text. All dialogs are logged to the dialog buffer with type, message, and action taken.
 
+### JavaScript execution (`js` and `eval`)
+
+`js` runs a single expression; `eval` runs a JS file. Both support `await` — expressions containing `await` are automatically wrapped in an async context:
+
+```bash
+$B js "await fetch('/api/data').then(r => r.json())"  # works
+$B js "document.title"                                  # also works (no wrapping needed)
+$B eval my-script.js                                    # file with await works too
+```
+
+For `eval` files, single-line files return the expression value directly. Multi-line files need explicit `return` when using `await`. Comments containing "await" don't trigger wrapping.
+
 ### Multi-workspace support
 
 Each workspace gets its own isolated browser instance with its own Chromium process, tabs, cookies, and logs. State is stored in `.gstack/` inside the project root (detected via `git rev-parse --show-toplevel`).
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 3d67a917..9b4e93f9 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,8 @@
 
 ## 0.4.2 — 2026-03-16
 
+- **`$B js "await fetch(...)"` now just works.** Any `await` expression in `$B js` or `$B eval` is automatically wrapped in an async context. No more `SyntaxError: await is only valid in async functions`. Single-line eval files return values directly; multi-line files use explicit `return`.
+- **Contributor mode now reflects, not just reacts.** Instead of only filing reports when something breaks, contributor mode now prompts periodic reflection: "Rate your gstack experience 0-10. Not a 10? Think about why." Catches quality-of-life issues and friction that passive detection misses. Reports now include a 0-10 rating and "What would make this a 10" to focus on actionable improvements.
 - **Skills now respect your branch target.** `/ship`, `/review`, `/qa`, and `/plan-ceo-review` detect which branch your PR actually targets instead of assuming `main`. Stacked branches, Conductor workspaces targeting feature branches, and repos using `master` all just work now.
 - **`/retro` works on any default branch.** Repos using `master`, `develop`, or other default branch names are detected automatically — no more empty retros because the branch name was wrong.
 - **New `{{BASE_BRANCH_DETECT}}` placeholder** for skill authors — drop it into any template and get 3-step branch detection (PR base → repo default → fallback) for free.
@@ -9,6 +11,10 @@
 
 ### For contributors
 
+- Added `hasAwait()` helper with comment-stripping to avoid false positives on `// await` in eval files.
+- Smart eval wrapping: single-line → expression `(...)`, multi-line → block `{...}` with explicit `return`.
+- 6 new async wrapping unit tests, 40 new contributor mode preamble validation tests.
+- Calibration example framed as historical ("used to fail") to avoid implying a live bug post-fix.
 - Added "Writing SKILL templates" section to CLAUDE.md — rules for natural language over bash-isms, dynamic branch detection, self-contained code blocks.
 - Hardcoded-main regression test scans all `.tmpl` files for git commands with hardcoded `main`.
 - QA template cleaned up: removed `REPORT_DIR` shell variable, simplified port detection to prose.
diff --git a/CLAUDE.md b/CLAUDE.md
index bc21f606..6f12deae 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -118,6 +118,21 @@ CHANGELOG.md is **for users**, not contributors. Write it like product release n
 - No jargon: say "every question now tells you which project and branch you're in" not
   "AskUserQuestion format standardized across skill templates via preamble resolver."
 
+## E2E eval failure blame protocol
+
+When an E2E eval fails during `/ship` or any other workflow, **never claim "not
+related to our changes" without proving it.** These systems have invisible couplings —
+a preamble text change affects agent behavior, a new helper changes timing, a
+regenerated SKILL.md shifts prompt context.
+
+**Required before attributing a failure to "pre-existing":**
+1. Run the same eval on main (or base branch) and show it fails there too
+2. If it passes on main but fails on the branch — it IS your change. Trace the blame.
+3. If you can't run on main, say "unverified — may or may not be related" and flag it
+   as a risk in the PR body
+
+"Pre-existing" without receipts is a lazy claim. Prove it or don't say it.
+
 ## Deploying to the active skill
 
 The active skill lives at `~/.claude/skills/gstack/`. After making changes:
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index b06b837e..4af2e889 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -22,9 +22,11 @@ bin/dev-teardown               # deactivate — back to your global install
 
 ## Contributor mode
 
-Contributor mode is for people who want to fix gstack when it annoys them. Enable it
-and Claude Code will automatically log issues to `~/.gstack/contributor-logs/` as you
-work — what you were doing, what went wrong, repro steps, raw output.
+Contributor mode turns gstack into a self-improving tool. Enable it and Claude Code
+will periodically reflect on its gstack experience — rating it 0-10 at the end of
+each major workflow step. When something isn't a 10, it thinks about why and files
+a report to `~/.gstack/contributor-logs/` with what happened, repro steps, and what
+would make it better.
 
 ```bash
 ~/.claude/skills/gstack/bin/gstack-config set gstack_contributor true
@@ -36,7 +38,7 @@ the issue, fix it, and open a PR.
 
 ### The contributor workflow
 
-1. **Hit friction while using gstack** — contributor mode logs it automatically
+1. **Use gstack normally** — contributor mode reflects and logs issues automatically
 2. **Check your logs:** `ls ~/.gstack/contributor-logs/`
 3. **Fork and clone gstack** (if you haven't already)
 4. **Symlink your fork into the project where you hit the bug:**
diff --git a/SKILL.md b/SKILL.md
index b362e824..2239a91b 100644
--- a/SKILL.md
+++ b/SKILL.md
@@ -44,12 +44,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -58,20 +61,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 # gstack browse: QA Testing & Dogfooding
 
diff --git a/browse/SKILL.md b/browse/SKILL.md
index 28e976df..c0d7a4eb 100644
--- a/browse/SKILL.md
+++ b/browse/SKILL.md
@@ -44,12 +44,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -58,20 +61,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 # browse: QA Testing & Dogfooding
 
diff --git a/browse/src/read-commands.ts b/browse/src/read-commands.ts
index 53efec8a..a7d76352 100644
--- a/browse/src/read-commands.ts
+++ b/browse/src/read-commands.ts
@@ -11,6 +11,12 @@ import type { Page } from 'playwright';
 import * as fs from 'fs';
 import * as path from 'path';
 
+/** Detect the await keyword after stripping line (//) and block comments. Accepted risks: await inside a string literal still triggers wrapping, and a "//" inside a string literal (e.g. a URL) is stripped like a comment, hiding any await that follows it on the same line. */
+function hasAwait(code: string): boolean {
+  const stripped = code.replace(/\/\/.*$/gm, '').replace(/\/\*[\s\S]*?\*\//g, '');
+  return /\bawait\b/.test(stripped);
+}
+
 // Security: Path validation to prevent path traversal attacks
 const SAFE_DIRECTORIES = ['/tmp', process.cwd()];
 
@@ -118,7 +124,8 @@ export async function handleReadCommand(
     case 'js': {
       const expr = args[0];
       if (!expr) throw new Error('Usage: browse js <expression>');
-      const result = await page.evaluate(expr);
+      const wrapped = hasAwait(expr) ? `(async()=>(${expr}))()` : expr;
+      const result = await page.evaluate(wrapped);
       return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
     }
 
@@ -128,6 +135,13 @@ export async function handleReadCommand(
       validateReadPath(filePath);
       if (!fs.existsSync(filePath)) throw new Error(`File not found: ${filePath}`);
       const code = fs.readFileSync(filePath, 'utf-8');
+      if (hasAwait(code)) {
+        const trimmed = code.trim();
+        const isSingleExpr = trimmed.split('\n').length === 1;
+        const wrapped = isSingleExpr ? `(async()=>(${trimmed}))()` : `(async()=>{\n${code}\n})()`;
+        const result = await page.evaluate(wrapped);
+        return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
+      }
       const result = await page.evaluate(code);
       return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
     }
diff --git a/browse/test/commands.test.ts b/browse/test/commands.test.ts
index a3e201d9..d8aaeab6 100644
--- a/browse/test/commands.test.ts
+++ b/browse/test/commands.test.ts
@@ -144,6 +144,60 @@ describe('Inspection', () => {
     expect(obj.b).toBe(2);
   });
 
+  test('js supports await expressions', async () => {
+    const result = await handleReadCommand('js', ['await Promise.resolve(42)'], bm);
+    expect(result).toBe('42');
+  });
+
+  test('js does not false-positive on await substring', async () => {
+    const result = await handleReadCommand('js', ['(() => { const awaitable = 5; return awaitable })()'], bm);
+    expect(result).toBe('5');
+  });
+
+  test('eval supports await in single-line file', async () => {
+    const tmp = '/tmp/eval-await-test.js';
+    fs.writeFileSync(tmp, 'await Promise.resolve("hello from eval")');
+    try {
+      const result = await handleReadCommand('eval', [tmp], bm);
+      expect(result).toBe('hello from eval');
+    } finally {
+      fs.unlinkSync(tmp);
+    }
+  });
+
+  test('eval does not wrap when await is only in a comment', async () => {
+    const tmp = '/tmp/eval-comment-test.js';
+    fs.writeFileSync(tmp, '// no need to await this\ndocument.title');
+    try {
+      const result = await handleReadCommand('eval', [tmp], bm);
+      expect(result).toBe('Test Page - Basic');
+    } finally {
+      fs.unlinkSync(tmp);
+    }
+  });
+
+  test('eval multi-line with await and explicit return', async () => {
+    const tmp = '/tmp/eval-multiline-await.js';
+    fs.writeFileSync(tmp, 'const data = await Promise.resolve("multi");\nreturn data;');
+    try {
+      const result = await handleReadCommand('eval', [tmp], bm);
+      expect(result).toBe('multi');
+    } finally {
+      fs.unlinkSync(tmp);
+    }
+  });
+
+  test('eval multi-line with await but no return gives empty string', async () => {
+    const tmp = '/tmp/eval-multiline-no-return.js';
+    fs.writeFileSync(tmp, 'const data = await Promise.resolve("lost");\ndata;');
+    try {
+      const result = await handleReadCommand('eval', [tmp], bm);
+      expect(result).toBe('');
+    } finally {
+      fs.unlinkSync(tmp);
+    }
+  });
+
   test('css returns computed property', async () => {
     const result = await handleReadCommand('css', ['h1', 'color'], bm);
     // Navy color
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index 77ca6438..07830998 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -44,12 +44,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -58,20 +61,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 ## Step 0: Detect base branch
 
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index 819ef072..ad2baca6 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -44,12 +44,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -58,20 +61,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 # Plan Review Mode
 
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index 438b7826..27d939be 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -43,12 +43,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -57,20 +60,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 # /qa-only: Report-Only QA Testing
 
diff --git a/qa/SKILL.md b/qa/SKILL.md
index 5ea4643a..938bf10b 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -48,12 +48,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -62,20 +65,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 ## Step 0: Detect base branch
 
diff --git a/retro/SKILL.md b/retro/SKILL.md
index ca44f49e..39b7ee13 100644
--- a/retro/SKILL.md
+++ b/retro/SKILL.md
@@ -43,12 +43,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -57,20 +60,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 ## Detect default branch
 
diff --git a/review/SKILL.md b/review/SKILL.md
index 949a0c65..b94f8a30 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -44,12 +44,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -58,20 +61,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 ## Step 0: Detect base branch
 
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index 9c81e968..f3d93dbb 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -123,12 +123,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If \`_CONTRIB\` is \`true\`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If \`_CONTRIB\` is \`true\`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write \`~/.gstack/contributor-logs/{slug}.md\` with this structure:
+**Calibration — this is the bar:** For example, \`$B js "await fetch(...)"\` used to fail with \`SyntaxError: await is only valid in async functions\` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write \`~/.gstack/contributor-logs/{slug}.md\` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 \`\`\`
 # {Title}
@@ -137,20 +140,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+\`\`\`
+{paste the actual error or unexpected output here}
+\`\`\`
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 \`\`\`
 
-Then run: \`mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md\`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. \`browse-snapshot-ref-gap\`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"`;
+Slug: lowercase, hyphens, max 60 chars (e.g. \`browse-js-no-await\`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"`;
 }
 
 function generateBrowseSetup(): string {
diff --git a/setup-browser-cookies/SKILL.md b/setup-browser-cookies/SKILL.md
index 06230249..d522b270 100644
--- a/setup-browser-cookies/SKILL.md
+++ b/setup-browser-cookies/SKILL.md
@@ -41,12 +41,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -55,20 +58,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 # Setup Browser Cookies
 
diff --git a/ship/SKILL.md b/ship/SKILL.md
index 47a9da11..7791f4bc 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -43,12 +43,15 @@ Per-skill instructions may add additional formatting rules on top of this baseli
 
 ## Contributor Mode
 
-If `_CONTRIB` is `true`: you are in **contributor mode**. When you hit friction with **gstack itself** (not the user's app), file a field report. Think: "hey, I was trying to do X with gstack and it didn't work / was confusing / was annoying. Here's what happened."
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
 
-**gstack issues:** browse command fails/wrong output, snapshot missing elements, skill instructions unclear or misleading, binary crash/hang, unhelpful error message, any rough edge or annoyance — even minor stuff.
-**NOT gstack issues:** user's app bugs, network errors to user's URL, auth failures on user's site.
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
 
-**To file:** write `~/.gstack/contributor-logs/{slug}.md` with this structure:
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
 
 ```
 # {Title}
@@ -57,20 +60,23 @@ Hey gstack team — ran into this while using /{skill-name}:
 
 **What I was trying to do:** {what the user/agent was attempting}
 **What happened instead:** {what actually happened}
-**How annoying (1-5):** {1=meh, 3=friction, 5=blocker}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
 
 ## Steps to reproduce
 1. {step}
 
 ## Raw output
-(wrap any error messages or unexpected output in a markdown code block)
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
 
 **Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
 ```
 
-Then run: `mkdir -p ~/.gstack/contributor-logs && open ~/.gstack/contributor-logs/{slug}.md`
-
-Slug: lowercase, hyphens, max 60 chars (e.g. `browse-snapshot-ref-gap`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
 
 ## Step 0: Detect base branch
 
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 4978ce53..aa50a976 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -13,6 +13,11 @@ import * as os from 'os';
 const ROOT = path.resolve(import.meta.dir, '..');
 
 // Skip unless EVALS=1. Session runner strips CLAUDE* env vars to avoid nested session issues.
+//
+// BLAME PROTOCOL: When an eval fails, do NOT claim "pre-existing" or "not related
+// to our changes" without proof. Run the same eval on main to verify. These tests
+// have invisible couplings — preamble text, SKILL.md content, and timing all affect
+// agent behavior. See CLAUDE.md "E2E eval failure blame protocol" for details.
 const evalsEnabled = !!process.env.EVALS;
 const describeE2E = evalsEnabled ? describe : describe.skip;
 
@@ -322,10 +327,16 @@ File a contributor report about this issue. Then tell me what you filed.`,
     const logFiles = fs.readdirSync(logsDir).filter(f => f.endsWith('.md'));
     expect(logFiles.length).toBeGreaterThan(0);
 
+    // Verify new reflection-based format
     const logContent = fs.readFileSync(path.join(logsDir, logFiles[0]), 'utf-8');
     expect(logContent).toContain('Hey gstack team');
     expect(logContent).toContain('What I was trying to do');
     expect(logContent).toContain('What happened instead');
+    expect(logContent).toMatch(/rating/i);
+    // Verify report has repro steps (agent may use "Steps to reproduce", "Repro Steps", etc.)
+    expect(logContent).toMatch(/repro|steps to reproduce|how to reproduce/i);
+    // Verify report has a date/version footer; accept any 20xx year so the check does not expire after 2026
+    expect(logContent).toMatch(/date.*20\d{2}|20\d{2}.*date/i);
 
     // Clean up
     try { fs.rmSync(contribDir, { recursive: true, force: true }); } catch {}
@@ -424,16 +435,20 @@ describeE2E('QA skill E2E', () => {
 
   test('/qa quick completes without browse errors', async () => {
     const result = await runSkillTest({
-      prompt: `You have a browse binary at ${browseBin}. Assign it to B variable like: B="${browseBin}"
+      prompt: `B="${browseBin}"
+
+The test server is already running at: ${testServer.url}
+Target page: ${testServer.url}/basic.html
 
 Read the file qa/SKILL.md for the QA workflow instructions.
 
 Run a Quick-depth QA test on ${testServer.url}/basic.html
 Do NOT use AskUserQuestion — run Quick tier directly.
+Do NOT try to start a server or discover ports — the URL above is ready.
 Write your report to ${qaDir}/qa-reports/qa-report.md`,
       workingDirectory: qaDir,
       maxTurns: 35,
-      timeout: 180_000,
+      timeout: 240_000,
       testName: 'qa-quick',
       runId,
     });
@@ -448,7 +463,7 @@ Write your report to ${qaDir}/qa-reports/qa-report.md`,
     }
     // Accept error_max_turns — the agent doing thorough QA work is not a failure
     expect(['success', 'error_max_turns']).toContain(result.exitReason);
-  }, 240_000);
+  }, 300_000);
 });
 
 // --- B5: Review skill E2E ---
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 2a947b15..3ff5c356 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -496,6 +496,44 @@ describe('v0.4.1 preamble features', () => {
   }
 });
 
+// --- Contributor mode preamble structure validation ---
+// Reads each listed SKILL.md from disk and checks for literal, case-sensitive marker strings.
+describe('Contributor mode preamble structure', () => {
+  const skillsWithPreamble = [ // paths are joined onto ROOT inside each test below
+    'SKILL.md', 'browse/SKILL.md', 'qa/SKILL.md',
+    'qa-only/SKILL.md',
+    'setup-browser-cookies/SKILL.md',
+    'ship/SKILL.md', 'review/SKILL.md',
+    'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
+    'retro/SKILL.md',
+  ];
+
+  for (const skill of skillsWithPreamble) { // registers four separate tests per file
+    test(`${skill} has 0-10 rating in contributor mode`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
+      expect(content).toContain('0 to 10'); // rating scale wording in the instructions
+      expect(content).toContain('My rating'); // rating field of the report template
+    });
+
+    test(`${skill} has calibration example`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
+      expect(content).toContain('Calibration');
+      expect(content).toContain('the bar');
+    });
+
+    test(`${skill} has "what would make this a 10" field`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
+      expect(content).toContain('What would make this a 10');
+    });
+
+    test(`${skill} uses periodic reflection (not per-command)`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
+      expect(content).toContain('workflow step');
+      expect(content).not.toContain('After you use gstack-provided CLIs'); // presumably superseded per-command wording; confirm
+    });
+  }
+});
+
 describe('Enum & Value Completeness in review checklist', () => {
   const checklist = fs.readFileSync(path.join(ROOT, 'review', 'checklist.md'), 'utf-8');
 

From 276d0cc6cb944f295377675f7dff57b916d2c29f Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 12:27:47 -0500
Subject: [PATCH 03/22] feat: always-on ELI16 + branch detection (v0.4.3)
 (#108)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: always-on ELI16 + branch detection in preamble

- Add _BRANCH detection to preamble bash block (git branch --show-current)
- Merge ELI16 rules into default AskUserQuestion format (always-on)
- Remove _SESSIONS >= 3 conditional — better questions always
- Add simplification rules: plain English, no jargon, no raw function names
- Update tests for branch detection and simplification regression guard

* chore: bump version and changelog (v0.4.3)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                   | 11 +++++++++++
 SKILL.md                       | 12 +++++++-----
 VERSION                        |  2 +-
 browse/SKILL.md                | 12 +++++++-----
 plan-ceo-review/SKILL.md       | 12 +++++++-----
 plan-eng-review/SKILL.md       | 12 +++++++-----
 qa-only/SKILL.md               | 12 +++++++-----
 qa/SKILL.md                    | 12 +++++++-----
 retro/SKILL.md                 | 12 +++++++-----
 review/SKILL.md                | 12 +++++++-----
 scripts/gen-skill-docs.ts      | 12 +++++++-----
 setup-browser-cookies/SKILL.md | 12 +++++++-----
 ship/SKILL.md                  | 12 +++++++-----
 test/gen-skill-docs.test.ts    | 13 ++++++++++++-
 test/skill-validation.test.ts  |  2 +-
 15 files changed, 102 insertions(+), 58 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 9b4e93f9..99b7086c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,16 @@
 # Changelog
 
+## 0.4.3 — 2026-03-16
+
+- **Every question is now crystal clear, every time.** You used to need 3+ sessions running before gstack would give you full context and plain English explanations. Now every question — even in a single session — tells you the project, branch, and what's happening, explained simply enough to understand mid-context-switch. No more "sorry, explain it to me more simply."
+- **Branch name is always correct.** gstack now detects your current branch at runtime instead of relying on the snapshot from when the conversation started. Switch branches mid-session? gstack keeps up.
+
+### For contributors
+
+- Merged ELI16 rules into base AskUserQuestion format — one format instead of two, no `_SESSIONS >= 3` conditional.
+- Added `_BRANCH` detection to preamble bash block (`git branch --show-current` with fallback).
+- Added regression guard tests for branch detection and simplification rules.
+
 ## 0.4.2 — 2026-03-16
 
 - **`$B js "await fetch(...)"` now just works.** Any `await` expression in `$B js` or `$B eval` is automatically wrapped in an async context. No more `SyntaxError: await is only valid in async functions`. Single-line eval files return values directly; multi-line files use explicit `return`.
diff --git a/SKILL.md b/SKILL.md
index 2239a91b..76007eee 100644
--- a/SKILL.md
+++ b/SKILL.md
@@ -26,6 +26,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -33,12 +35,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/VERSION b/VERSION
index 2b7c5ae0..17b2ccd9 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.4.2
+0.4.3
diff --git a/browse/SKILL.md b/browse/SKILL.md
index c0d7a4eb..dd473dc0 100644
--- a/browse/SKILL.md
+++ b/browse/SKILL.md
@@ -26,6 +26,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -33,12 +35,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index 07830998..b05db5e9 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -26,6 +26,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -33,12 +35,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index ad2baca6..4cd8f481 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -26,6 +26,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -33,12 +35,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index 27d939be..5e74f03e 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -25,6 +25,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -32,12 +34,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/qa/SKILL.md b/qa/SKILL.md
index 938bf10b..6b078a9d 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -30,6 +30,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -37,12 +39,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/retro/SKILL.md b/retro/SKILL.md
index 39b7ee13..c7781525 100644
--- a/retro/SKILL.md
+++ b/retro/SKILL.md
@@ -25,6 +25,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -32,12 +34,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/review/SKILL.md b/review/SKILL.md
index b94f8a30..285a4922 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -26,6 +26,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -33,12 +35,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index f3d93dbb..9d79189a 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -105,6 +105,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 \`\`\`
 
 If output shows \`UPGRADE_AVAILABLE <old> <new>\`: read \`~/.claude/skills/gstack/gstack-upgrade/SKILL.md\` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If \`JUST_UPGRADED <from> <to>\`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -112,12 +114,12 @@ If output shows \`UPGRADE_AVAILABLE <old> <new>\`: read \`~/.claude/skills/gstac
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. \`RECOMMENDATION: Choose [X] because [one-line reason]\`
-4. Lettered options: \`A) ... B) ... C) ...\`
+1. **Re-ground:** State the project, the current branch (use the \`_BRANCH\` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** \`RECOMMENDATION: Choose [X] because [one-line reason]\`
+4. **Options:** Lettered options: \`A) ... B) ... C) ...\`
 
-If \`_SESSIONS\` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/setup-browser-cookies/SKILL.md b/setup-browser-cookies/SKILL.md
index d522b270..faebe520 100644
--- a/setup-browser-cookies/SKILL.md
+++ b/setup-browser-cookies/SKILL.md
@@ -23,6 +23,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -30,12 +32,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/ship/SKILL.md b/ship/SKILL.md
index 7791f4bc..ee98ecaf 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -25,6 +25,8 @@ touch ~/.gstack/sessions/"$PPID"
 _SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
 find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
@@ -32,12 +34,12 @@ If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/g
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
-1. Context: project name, current branch, what we're working on (1-2 sentences)
-2. The specific question or decision point
-3. `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. Lettered options: `A) ... B) ... C) ...`
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
 
-If `_SESSIONS` is 3 or more: the user is juggling multiple gstack sessions and context-switching heavily. **ELI16 mode** — they may not remember what this conversation is about. Every AskUserQuestion MUST re-ground them: state the project, the branch, the current plan/task, then the specific problem, THEN the recommendation and options. Be extra clear and self-contained — assume they haven't looked at this window in 20 minutes.
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index e77989f0..7ec8b280 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -144,7 +144,18 @@ describe('gen-skill-docs', () => {
     const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     expect(content).toContain('_SESSIONS');
     expect(content).toContain('RECOMMENDATION');
-    expect(content).toContain('ELI16');
+  });
+
+  test('generated SKILL.md contains branch detection', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
+    expect(content).toContain('_BRANCH');
+    expect(content).toContain('git branch --show-current');
+  });
+
+  test('generated SKILL.md contains ELI16 simplification rules', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
+    expect(content).toContain('No raw function names');
+    expect(content).toContain('plain English');
   });
 
   test('qa and qa-only templates use QA_METHODOLOGY placeholder', () => {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 3ff5c356..77f09ee0 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -491,7 +491,7 @@ describe('v0.4.1 preamble features', () => {
     test(`${skill} contains session awareness`, () => {
       const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
       expect(content).toContain('_SESSIONS');
-      expect(content).toContain('ELI16');
+      expect(content).toContain('RECOMMENDATION');
     });
   }
 });

From a68244ab57aafd43e83764f603d43291e53aca74 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 12:30:22 -0500
Subject: [PATCH 04/22] =?UTF-8?q?feat:=20/document-release=20skill=20?=
 =?UTF-8?q?=E2=80=94=20post-ship=20doc=20updates=20(v0.4.3)=20(#109)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* docs: update project documentation for v0.4.2

- README: skill count 9→10, added /document-release to skills table,
  install/uninstall sections, and dedicated section with example
- CHANGELOG: added /document-release bullet to v0.4.2 entry

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* feat: add /document-release skill with smart VERSION handling

New skill runs after /ship but before PR merge. Reads every doc file,
cross-references the diff, auto-updates factual changes, asks about
risky edits. CHANGELOG clobber protection: never uses Write tool on
CHANGELOG.md, only Edit with exact old_string matches.

Smart VERSION logic: instead of silently skipping already-bumped
versions, compares CHANGELOG entry scope against full diff and asks
if significant uncovered changes exist.

Also fixes gstack-upgrade/SKILL.md missing from skill-check.ts
SKILL_FILES array (existing inconsistency with gen-skill-docs.ts).

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* feat: /review Step 5.6 — documentation staleness check

Review skill now cross-references code changes against doc files.
If a doc describes a feature that changed but the doc wasn't updated,
flags it as INFORMATIONAL with a pointer to /document-release.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* test: /document-release E2E with CHANGELOG clobber guard

E2E test creates a repo with existing CHANGELOG entries, runs
/document-release, and asserts original entries survive. Critical
guardrail against the incident where an agent replaced CHANGELOG
entries during conflict resolution.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: bump to v0.4.3 — /document-release skill

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: regenerate SKILL.md files after merge

* chore: regenerate SKILL.md files after merge

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 CHANGELOG.md                   |   1 +
 CLAUDE.md                      |   1 +
 README.md                      |  32 ++-
 TODOS.md                       |  26 ++
 document-release/SKILL.md      | 437 +++++++++++++++++++++++++++++++++
 document-release/SKILL.md.tmpl | 355 ++++++++++++++++++++++++++
 review/SKILL.md                |  14 ++
 review/SKILL.md.tmpl           |  14 ++
 scripts/gen-skill-docs.ts      |   1 +
 scripts/skill-check.ts         |   2 +
 test/skill-e2e.test.ts         | 104 ++++++++
 test/skill-validation.test.ts  |   3 +
 12 files changed, 986 insertions(+), 4 deletions(-)
 create mode 100644 document-release/SKILL.md
 create mode 100644 document-release/SKILL.md.tmpl

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 99b7086c..3c3fcceb 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,7 @@
 
 ## 0.4.3 — 2026-03-16
 
+- **New `/document-release` skill.** Run it after `/ship` but before merging — it reads every doc file in your project, cross-references the diff, and updates README, ARCHITECTURE, CONTRIBUTING, CHANGELOG, and TODOS to match what you actually shipped. Risky changes get surfaced as questions; everything else is automatic.
 - **Every question is now crystal clear, every time.** You used to need 3+ sessions running before gstack would give you full context and plain English explanations. Now every question — even in a single session — tells you the project, branch, and what's happening, explained simply enough to understand mid-context-switch. No more "sorry, explain it to me more simply."
 - **Branch name is always correct.** gstack now detects your current branch at runtime instead of relying on the snapshot from when the conversation started. Switch branches mid-session? gstack keeps up.
 
diff --git a/CLAUDE.md b/CLAUDE.md
index 6f12deae..85a7cda3 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -48,6 +48,7 @@ gstack/
 ├── plan-ceo-review/ # /plan-ceo-review skill
 ├── plan-eng-review/ # /plan-eng-review skill
 ├── retro/           # Retrospective skill
+├── document-release/ # /document-release skill (post-ship doc updates)
 ├── setup            # One-time setup: build binary + symlink skills
 ├── SKILL.md         # Generated from SKILL.md.tmpl (don't edit directly)
 ├── SKILL.md.tmpl    # Template: edit this, run gen:skill-docs
diff --git a/README.md b/README.md
index ce994a45..2b87d178 100644
--- a/README.md
+++ b/README.md
@@ -2,7 +2,7 @@
 
 **gstack turns Claude Code from one generic assistant into a team of specialists you can summon on demand.**
 
-Nine opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, code review, one-command shipping, browser automation, QA testing, and engineering retrospectives — all as slash commands.
+Ten opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
 
 ### Without gstack
 
@@ -26,6 +26,7 @@ Nine opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en
 | `/qa-only` | QA reporter | Report-only QA testing. Same methodology as /qa but never fixes anything. Use when you want a pure bug report without code changes. |
 | `/setup-browser-cookies` | Session manager | Import cookies from your real browser (Comet, Chrome, Arc, Brave, Edge) into the headless session. Test authenticated pages without logging in manually. |
 | `/retro` | Engineering manager | Team-aware retro: your deep-dive + per-person praise and growth opportunities for every contributor. |
+| `/document-release` | Technical writer | Update README, ARCHITECTURE, CONTRIBUTING, and project docs to match what you just shipped. |
 
 ## Demo: one feature, five modes
 
@@ -104,11 +105,11 @@ This is the setup I use. One person, ten parallel agents, each with the right co
 
 Open Claude Code and paste this. Claude will do the rest.
 
-> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /qa-only, /setup-browser-cookies, /retro. Then ask the user if they also want to add gstack to the current project so teammates get it.
+> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /qa-only, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
 
 ### Step 2: Add to your repo so teammates get it (optional)
 
-> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /setup-browser-cookies, /retro, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
+> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /qa-only, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
 
 Real files get committed to your repo (not a submodule), so `git clone` just works. The binary and node\_modules are gitignored — teammates just need to run `cd .claude/skills/gstack && ./setup` once to build (or `/browse` handles it automatically on first use).
 
@@ -590,6 +591,29 @@ It saves a JSON snapshot to `.context/retros/` so the next run can show trends.
 
 ---
 
+## `/document-release`
+
+This is my **technical writer mode**.
+
+After `/ship` creates the PR but before it merges, `/document-release` reads every documentation file in the project and cross-references it against the diff. It updates file paths, command lists, project structure trees, and anything else that drifted. Risky or subjective changes get surfaced as questions — everything else is handled automatically.
+
+```
+You:   /document-release
+
+Claude: Analyzing 21 files changed across 3 commits. Found 8 documentation files.
+
+        README.md: updated skill count from 9 to 10, added new skill to table
+        CLAUDE.md: added new directory to project structure
+        CONTRIBUTING.md: current — no changes needed
+        TODOS.md: marked 2 items complete, added 1 new item
+
+        All docs updated and committed. PR body updated with doc diff.
+```
+
+It also polishes CHANGELOG voice (without ever overwriting entries), cleans up completed TODOS, checks cross-doc consistency, and asks about VERSION bumps only when appropriate.
+
+---
+
 ## Troubleshooting
 
 **Skill not showing up in Claude Code?**
@@ -614,7 +638,7 @@ Or set `auto_upgrade: true` in `~/.gstack/config.yaml` to upgrade automatically
 
 Paste this into Claude Code:
 
-> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
+> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
 
 ## Development
 
diff --git a/TODOS.md b/TODOS.md
index 7bd1176a..d2f9282e 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -374,6 +374,32 @@
 **Priority:** P3
 **Depends on:** Ref staleness Parts 1+2 (shipped)
 
+## Document-Release
+
+### Auto-invoke /document-release from /ship
+
+**What:** Add Step 8.5 to /ship that reads document-release/SKILL.md and executes the doc update workflow after creating the PR.
+
+**Why:** Zero-friction doc updates — user runs /ship and docs are automatically current. No extra command to remember.
+
+**Context:** /ship currently ends at Step 8 (PR URL output). Step 8.5 would continue into the document-release workflow. Same pattern as /ship calling /review's checklist in Step 3.5.
+
+**Effort:** S
+**Priority:** P1
+**Depends on:** /document-release shipped
+
+### `{{DOC_VOICE}}` shared resolver
+
+**What:** Create a placeholder resolver in gen-skill-docs.ts encoding the gstack voice guide (friendly, user-forward, lead with benefits). Inject into /ship Step 5, /document-release Step 5, and reference from CLAUDE.md.
+
+**Why:** DRY — voice rules currently live inline in 3 places (CLAUDE.md CHANGELOG style section, /ship Step 5, /document-release Step 5). When the voice evolves, all three drift.
+
+**Context:** Same pattern as `{{QA_METHODOLOGY}}` — shared block injected into multiple templates to prevent drift. ~20 lines in gen-skill-docs.ts.
+
+**Effort:** S
+**Priority:** P2
+**Depends on:** None
+
 ## Completed
 
 ### Phase 1: Foundations (v0.2.0)
diff --git a/document-release/SKILL.md b/document-release/SKILL.md
new file mode 100644
index 00000000..694d64da
--- /dev/null
+++ b/document-release/SKILL.md
@@ -0,0 +1,437 @@
+---
+name: document-release
+version: 1.0.0
+description: |
+  Post-ship documentation update. Reads all project docs, cross-references the
+  diff, updates README/ARCHITECTURE/CONTRIBUTING/CLAUDE.md to match what shipped,
+  polishes CHANGELOG voice, cleans up TODOS, and optionally bumps VERSION.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Grep
+  - Glob
+  - AskUserQuestion
+---
+<!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
+<!-- Regenerate: bun run gen:skill-docs -->
+
+## Preamble (run first)
+
+```bash
+_UPD=$(~/.claude/skills/gstack/bin/gstack-update-check 2>/dev/null || .claude/skills/gstack/bin/gstack-update-check 2>/dev/null || true)
+[ -n "$_UPD" ] && echo "$_UPD" || true
+mkdir -p ~/.gstack/sessions
+touch ~/.gstack/sessions/"$PPID"
+_SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
+find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
+_CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
+```
+
+If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
+
+## AskUserQuestion Format
+
+**ALWAYS follow this structure for every AskUserQuestion call:**
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
+
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
+
+Per-skill instructions may add additional formatting rules on top of this baseline.
+
+## Contributor Mode
+
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
+
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
+
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
+
+```
+# {Title}
+
+Hey gstack team — ran into this while using /{skill-name}:
+
+**What I was trying to do:** {what the user/agent was attempting}
+**What happened instead:** {what actually happened}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
+
+## Steps to reproduce
+1. {step}
+
+## Raw output
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
+
+**Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
+```
+
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+
+## Step 0: Detect base branch
+
+Determine which branch this PR targets. Use the result as "the base branch" in all subsequent steps.
+
+1. Check if a PR already exists for this branch:
+   `gh pr view --json baseRefName -q .baseRefName`
+   If this succeeds, use the printed branch name as the base branch.
+
+2. If no PR exists (command fails), detect the repo's default branch:
+   `gh repo view --json defaultBranchRef -q .defaultBranchRef.name`
+
+3. If both commands fail, fall back to `main`.
+
+Print the detected base branch name. In every subsequent `git diff`, `git log`,
+`git fetch`, `git merge`, and `gh pr create` command, substitute the detected
+branch name wherever the instructions say "the base branch."
+
+---
+
+# Document Release: Post-Ship Documentation Update
+
+You are running the `/document-release` workflow. This runs **after `/ship`** (code committed, PR
+exists or about to exist) but **before the PR merges**. Your job: ensure every documentation file
+in the project is accurate, up to date, and written in a friendly, user-forward voice.
+
+You are mostly automated. Make obvious factual updates directly. Stop and ask only for risky or
+subjective decisions.
+
+**Only stop for:**
+- Risky/questionable doc changes (narrative, philosophy, security, removals, large rewrites)
+- VERSION bump decision (if not already bumped, or if the existing bump does not cover all changes)
+- New TODOS items to add
+- Cross-doc contradictions that are narrative (not factual)
+
+**Never stop for:**
+- Factual corrections clearly from the diff
+- Adding items to tables/lists
+- Updating paths, counts, version numbers
+- Fixing stale cross-references
+- CHANGELOG voice polish (minor wording adjustments)
+- Marking TODOS complete
+- Cross-doc factual inconsistencies (e.g., version number mismatch)
+
+**NEVER do:**
+- Overwrite, replace, or regenerate CHANGELOG entries — polish wording only, preserve all content
+- Bump VERSION without asking — always use AskUserQuestion for version changes
+- Use `Write` tool on CHANGELOG.md — always use `Edit` with exact `old_string` matches
+
+---
+
+## Step 1: Pre-flight & Diff Analysis
+
+1. Check the current branch. If on the base branch, **abort**: "You're on the base branch. Run from a feature branch."
+
+2. Gather context about what changed:
+
+```bash
+git diff <base>...HEAD --stat
+```
+
+```bash
+git log <base>..HEAD --oneline
+```
+
+```bash
+git diff <base>...HEAD --name-only
+```
+
+3. Discover all documentation files in the repo:
+
+```bash
+find . -maxdepth 2 -name "*.md" -not -path "./.git/*" -not -path "./node_modules/*" -not -path "./.gstack/*" -not -path "./.context/*" | sort
+```
+
+4. Classify the changes into categories relevant to documentation:
+   - **New features** — new files, new commands, new skills, new capabilities
+   - **Changed behavior** — modified services, updated APIs, config changes
+   - **Removed functionality** — deleted files, removed commands
+   - **Infrastructure** — build system, test infrastructure, CI
+
+5. Output a brief summary: "Analyzing N files changed across M commits. Found K documentation files to review."
+
+---
+
+## Step 2: Per-File Documentation Audit
+
+Read each documentation file and cross-reference it against the diff. Use these generic heuristics
+(adapt to whatever project you're in — these are not gstack-specific):
+
+**README.md:**
+- Does it describe all features and capabilities visible in the diff?
+- Are install/setup instructions consistent with the changes?
+- Are examples, demos, and usage descriptions still valid?
+- Are troubleshooting steps still accurate?
+
+**ARCHITECTURE.md:**
+- Do ASCII diagrams and component descriptions match the current code?
+- Are design decisions and "why" explanations still accurate?
+- Be conservative — only update things clearly contradicted by the diff. Architecture docs
+  describe things unlikely to change frequently.
+
+**CONTRIBUTING.md — New contributor smoke test:**
+- Walk through the setup instructions as if you are a brand new contributor.
+- Are the listed commands accurate? Would each step succeed?
+- Do test tier descriptions match the current test infrastructure?
+- Are workflow descriptions (dev setup, contributor mode, etc.) current?
+- Flag anything that would fail or confuse a first-time contributor.
+
+**CLAUDE.md / project instructions:**
+- Does the project structure section match the actual file tree?
+- Are listed commands and scripts accurate?
+- Do build/test instructions match what's in package.json (or equivalent)?
+
+**Any other .md files:**
+- Read the file, determine its purpose and audience.
+- Cross-reference the file against the diff to check whether the diff contradicts anything the file says.
+
+For each file, classify needed updates as:
+
+- **Auto-update** — Factual corrections clearly warranted by the diff: adding an item to a
+  table, updating a file path, fixing a count, updating a project structure tree.
+- **Ask user** — Narrative changes, section removal, security model changes, large rewrites
+  (more than ~10 lines in one section), ambiguous relevance, adding entirely new sections.
+
+---
+
+## Step 3: Apply Auto-Updates
+
+Make all clear, factual updates directly using the Edit tool.
+
+For each file modified, output a one-line summary describing **what specifically changed** — not
+just "Updated README.md" but "README.md: added /new-skill to skills table, updated skill count
+from 9 to 10."
+
+**Never auto-update:**
+- README introduction or project positioning
+- ARCHITECTURE philosophy or design rationale
+- Security model descriptions
+- Removal of entire sections from any document
+
+---
+
+## Step 4: Ask About Risky/Questionable Changes
+
+For each risky or questionable update identified in Step 2, use AskUserQuestion with:
+- Context: project name, branch, which doc file, what we're reviewing
+- The specific documentation decision
+- `RECOMMENDATION: Choose [X] because [one-line reason]`
+- Options including C) Skip — leave as-is
+
+Apply approved changes immediately after each answer.
+
+---
+
+## Step 5: CHANGELOG Voice Polish
+
+**CRITICAL — NEVER CLOBBER CHANGELOG ENTRIES.**
+
+This step polishes voice. It does NOT rewrite, replace, or regenerate CHANGELOG content.
+
+A real incident occurred where an agent replaced existing CHANGELOG entries when it should have
+preserved them. This skill must NEVER do that.
+
+**Rules:**
+1. Read the entire CHANGELOG.md first. Understand what is already there.
+2. Only modify wording within existing entries. Never delete, reorder, or replace entries.
+3. Never regenerate a CHANGELOG entry from scratch. The entry was written by `/ship` from the
+   actual diff and commit history. It is the source of truth. You are polishing prose, not
+   rewriting history.
+4. If an entry looks wrong or incomplete, use AskUserQuestion — do NOT silently fix it.
+5. Use Edit tool with exact `old_string` matches — never use Write to overwrite CHANGELOG.md.
+
+**If CHANGELOG was not modified in this branch:** skip this step.
+
+**If CHANGELOG was modified in this branch**, review the entry for voice:
+
+- **Sell test:** Would a user reading each bullet think "oh nice, I want to try that"? If not,
+  rewrite the wording (not the content).
+- Lead with what the user can now **do** — not implementation details.
+- "You can now..." not "Refactored the..."
+- Flag and rewrite any entry that reads like a commit message.
+- Internal/contributor changes belong in a separate "### For contributors" subsection.
+- Auto-fix minor voice adjustments. Use AskUserQuestion if a rewrite would alter meaning.
+
+---
+
+## Step 6: Cross-Doc Consistency & Discoverability Check
+
+After auditing each file individually, do a cross-doc consistency pass:
+
+1. Does the README's feature/capability list match what CLAUDE.md (or project instructions) describes?
+2. Does ARCHITECTURE's component list match CONTRIBUTING's project structure description?
+3. Does CHANGELOG's latest version match the VERSION file?
+4. **Discoverability:** Is every documentation file reachable from README.md or CLAUDE.md? If
+   ARCHITECTURE.md exists but neither README nor CLAUDE.md links to it, flag it. Every doc
+   should be discoverable from one of the two entry-point files.
+5. Flag any contradictions between documents. Auto-fix clear factual inconsistencies (e.g., a
+   version mismatch). Use AskUserQuestion for narrative contradictions.
+
+---
+
+## Step 7: TODOS.md Cleanup
+
+This is a second pass that complements `/ship`'s Step 5.5. Read `review/TODOS-format.md` (if
+available) for the canonical TODO item format.
+
+If TODOS.md does not exist, skip this step.
+
+1. **Completed items not yet marked:** Cross-reference the diff against open TODO items. If a
+   TODO is clearly completed by the changes in this branch, move it to the Completed section
+   with `**Completed:** vX.Y.Z.W (YYYY-MM-DD)`. Be conservative — only mark items with clear
+   evidence in the diff.
+
+2. **Items needing description updates:** If a TODO references files or components that were
+   significantly changed, its description may be stale. Use AskUserQuestion to confirm whether
+   the TODO should be updated, completed, or left as-is.
+
+3. **New deferred work:** Check the diff for `TODO`, `FIXME`, `HACK`, and `XXX` comments. For
+   each one that represents meaningful deferred work (not a trivial inline note), use
+   AskUserQuestion to ask whether it should be captured in TODOS.md.
+
+---
+
+## Step 8: VERSION Bump Question
+
+**CRITICAL — NEVER BUMP VERSION WITHOUT ASKING.**
+
+1. **If VERSION does not exist:** Skip silently.
+
+2. Check if VERSION was already modified on this branch:
+
+```bash
+git diff <base>...HEAD -- VERSION
+```
+
+3. **If VERSION was NOT bumped:** Use AskUserQuestion:
+   - RECOMMENDATION: Choose C (Skip) because docs-only changes rarely warrant a version bump
+   - A) Bump PATCH (X.Y.Z+1) — if doc changes ship alongside code changes
+   - B) Bump MINOR (X.Y+1.0) — if this is a significant standalone release
+   - C) Skip — no version bump needed
+
+4. **If VERSION was already bumped:** Do NOT skip silently. Instead, check whether the bump
+   still covers the full scope of changes on this branch:
+
+   a. Read the CHANGELOG entry for the current VERSION. What features does it describe?
+   b. Read the full diff (`git diff <base>...HEAD --stat` and `git diff <base>...HEAD --name-only`).
+      Are there significant changes (new features, new skills, new commands, major refactors)
+      that are NOT mentioned in the CHANGELOG entry for the current version?
+   c. **If the CHANGELOG entry covers everything:** Skip — output "VERSION: Already bumped to
+      vX.Y.Z, covers all changes."
+   d. **If there are significant uncovered changes:** Use AskUserQuestion explaining what the
+      current version covers vs what's new, and ask:
+      - RECOMMENDATION: Choose A because the new changes warrant their own version
+      - A) Bump to next patch (X.Y.Z+1) — give the new changes their own version
+      - B) Keep current version — add new changes to the existing CHANGELOG entry
+      - C) Skip — leave version as-is, handle later
+
+   The key insight: a VERSION bump set for "feature A" should not silently absorb "feature B"
+   if feature B is substantial enough to deserve its own version entry.
+
+---
+
+## Step 9: Commit & Output
+
+**Empty check first:** Run `git status` (never use `-uall`). If no documentation files were
+modified by any previous step, output "All documentation is up to date." and exit without
+committing.
+
+**Commit:**
+
+1. Stage modified documentation files by name (never `git add -A` or `git add .`).
+2. Create a single commit:
+
+```bash
+git commit -m "$(cat <<'EOF'
+docs: update project documentation for vX.Y.Z.W
+
+Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
+EOF
+)"
+```
+
+3. Push to the current branch:
+
+```bash
+git push
+```
+
+**PR body update (idempotent, race-safe):**
+
+1. Read the existing PR body into a PID-unique tempfile:
+
+```bash
+gh pr view --json body -q .body > /tmp/gstack-pr-body-$$.md
+```
+
+2. If the tempfile already contains a `## Documentation` section, replace that section with the
+   updated content. If it does not contain one, append a `## Documentation` section at the end.
+
+3. The Documentation section should include a **doc diff preview** — for each file modified,
+   describe what specifically changed (e.g., "README.md: added /document-release to skills
+   table, updated skill count from 9 to 10").
+
+4. Write the updated body back:
+
+```bash
+gh pr edit --body-file /tmp/gstack-pr-body-$$.md
+```
+
+5. Clean up the tempfile:
+
+```bash
+rm -f /tmp/gstack-pr-body-$$.md
+```
+
+6. If `gh pr view` in step 1 fails (no PR exists): skip steps 2–5 with message "No PR found — skipping body update."
+7. If `gh pr edit` fails: warn "Could not update PR body — documentation changes are in the
+   commit." and continue.
+
+**Structured doc health summary (final output):**
+
+Output a scannable summary showing every documentation file's status:
+
+```
+Documentation health:
+  README.md       [status] ([details])
+  ARCHITECTURE.md [status] ([details])
+  CONTRIBUTING.md [status] ([details])
+  CHANGELOG.md    [status] ([details])
+  TODOS.md        [status] ([details])
+  VERSION         [status] ([details])
+```
+
+Where status is one of:
+- Updated — with description of what changed
+- Current — no changes needed
+- Voice polished — wording adjusted
+- Not bumped — user chose to skip
+- Already bumped — version was set by /ship
+- Skipped — file does not exist
+
+---
+
+## Important Rules
+
+- **Read before editing.** Always read the full content of a file before modifying it.
+- **Never clobber CHANGELOG.** Polish wording only. Never delete, replace, or regenerate entries.
+- **Never bump VERSION silently.** Always ask. Even if already bumped, check whether it covers the full scope of changes.
+- **Be explicit about what changed.** Every edit gets a one-line summary.
+- **Generic heuristics, not project-specific.** The audit checks work on any repo.
+- **Discoverability matters.** Every doc file should be reachable from README or CLAUDE.md.
+- **Voice: friendly, user-forward, not obscure.** Write like you're explaining to a smart person
+  who hasn't seen the code.
diff --git a/document-release/SKILL.md.tmpl b/document-release/SKILL.md.tmpl
new file mode 100644
index 00000000..e38c243c
--- /dev/null
+++ b/document-release/SKILL.md.tmpl
@@ -0,0 +1,355 @@
+---
+name: document-release
+version: 1.0.0
+description: |
+  Post-ship documentation update. Reads all project docs, cross-references the
+  diff, updates README/ARCHITECTURE/CONTRIBUTING/CLAUDE.md to match what shipped,
+  polishes CHANGELOG voice, cleans up TODOS, and optionally bumps VERSION.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Grep
+  - Glob
+  - AskUserQuestion
+---
+
+{{PREAMBLE}}
+
+{{BASE_BRANCH_DETECT}}
+
+# Document Release: Post-Ship Documentation Update
+
+You are running the `/document-release` workflow. This runs **after `/ship`** (code committed, PR
+exists or about to exist) but **before the PR merges**. Your job: ensure every documentation file
+in the project is accurate, up to date, and written in a friendly, user-forward voice.
+
+You are mostly automated. Make obvious factual updates directly. Stop and ask only for risky or
+subjective decisions.
+
+**Only stop for:**
+- Risky/questionable doc changes (narrative, philosophy, security, removals, large rewrites)
+- VERSION bump decision (if not already bumped, or if the existing bump does not cover all changes)
+- New TODOS items to add
+- Cross-doc contradictions that are narrative (not factual)
+
+**Never stop for:**
+- Factual corrections clearly from the diff
+- Adding items to tables/lists
+- Updating paths, counts, version numbers
+- Fixing stale cross-references
+- CHANGELOG voice polish (minor wording adjustments)
+- Marking TODOS complete
+- Cross-doc factual inconsistencies (e.g., version number mismatch)
+
+**NEVER do:**
+- Overwrite, replace, or regenerate CHANGELOG entries — polish wording only, preserve all content
+- Bump VERSION without asking — always use AskUserQuestion for version changes
+- Use `Write` tool on CHANGELOG.md — always use `Edit` with exact `old_string` matches
+
+---
+
+## Step 1: Pre-flight & Diff Analysis
+
+1. Check the current branch. If on the base branch, **abort**: "You're on the base branch. Run from a feature branch."
+
+2. Gather context about what changed:
+
+```bash
+git diff <base>...HEAD --stat
+```
+
+```bash
+git log <base>..HEAD --oneline
+```
+
+```bash
+git diff <base>...HEAD --name-only
+```
+
+3. Discover all documentation files in the repo:
+
+```bash
+find . -maxdepth 2 -name "*.md" -not -path "./.git/*" -not -path "./node_modules/*" -not -path "./.gstack/*" -not -path "./.context/*" | sort
+```
+
+4. Classify the changes into categories relevant to documentation:
+   - **New features** — new files, new commands, new skills, new capabilities
+   - **Changed behavior** — modified services, updated APIs, config changes
+   - **Removed functionality** — deleted files, removed commands
+   - **Infrastructure** — build system, test infrastructure, CI
+
+5. Output a brief summary: "Analyzing N files changed across M commits. Found K documentation files to review."
+
+---
+
+## Step 2: Per-File Documentation Audit
+
+Read each documentation file and cross-reference it against the diff. Use these generic heuristics
+(adapt to whatever project you're in — these are not gstack-specific):
+
+**README.md:**
+- Does it describe all features and capabilities visible in the diff?
+- Are install/setup instructions consistent with the changes?
+- Are examples, demos, and usage descriptions still valid?
+- Are troubleshooting steps still accurate?
+
+**ARCHITECTURE.md:**
+- Do ASCII diagrams and component descriptions match the current code?
+- Are design decisions and "why" explanations still accurate?
+- Be conservative — only update things clearly contradicted by the diff. Architecture docs
+  describe things unlikely to change frequently.
+
+**CONTRIBUTING.md — New contributor smoke test:**
+- Walk through the setup instructions as if you are a brand new contributor.
+- Are the listed commands accurate? Would each step succeed?
+- Do test tier descriptions match the current test infrastructure?
+- Are workflow descriptions (dev setup, contributor mode, etc.) current?
+- Flag anything that would fail or confuse a first-time contributor.
+
+**CLAUDE.md / project instructions:**
+- Does the project structure section match the actual file tree?
+- Are listed commands and scripts accurate?
+- Do build/test instructions match what's in package.json (or equivalent)?
+
+**Any other .md files:**
+- Read the file, determine its purpose and audience.
+- Cross-reference the file against the diff to check whether the diff contradicts anything the file says.
+
+For each file, classify needed updates as:
+
+- **Auto-update** — Factual corrections clearly warranted by the diff: adding an item to a
+  table, updating a file path, fixing a count, updating a project structure tree.
+- **Ask user** — Narrative changes, section removal, security model changes, large rewrites
+  (more than ~10 lines in one section), ambiguous relevance, adding entirely new sections.
+
+---
+
+## Step 3: Apply Auto-Updates
+
+Make all clear, factual updates directly using the Edit tool.
+
+For each file modified, output a one-line summary describing **what specifically changed** — not
+just "Updated README.md" but "README.md: added /new-skill to skills table, updated skill count
+from 9 to 10."
+
+**Never auto-update:**
+- README introduction or project positioning
+- ARCHITECTURE philosophy or design rationale
+- Security model descriptions
+- Removal of entire sections from any document
+
+---
+
+## Step 4: Ask About Risky/Questionable Changes
+
+For each risky or questionable update identified in Step 2, use AskUserQuestion with:
+- Context: project name, branch, which doc file, what we're reviewing
+- The specific documentation decision
+- `RECOMMENDATION: Choose [X] because [one-line reason]`
+- Options including C) Skip — leave as-is
+
+Apply approved changes immediately after each answer.
+
+---
+
+## Step 5: CHANGELOG Voice Polish
+
+**CRITICAL — NEVER CLOBBER CHANGELOG ENTRIES.**
+
+This step polishes voice. It does NOT rewrite, replace, or regenerate CHANGELOG content.
+
+A real incident occurred where an agent replaced existing CHANGELOG entries when it should have
+preserved them. This skill must NEVER do that.
+
+**Rules:**
+1. Read the entire CHANGELOG.md first. Understand what is already there.
+2. Only modify wording within existing entries. Never delete, reorder, or replace entries.
+3. Never regenerate a CHANGELOG entry from scratch. The entry was written by `/ship` from the
+   actual diff and commit history. It is the source of truth. You are polishing prose, not
+   rewriting history.
+4. If an entry looks wrong or incomplete, use AskUserQuestion — do NOT silently fix it.
+5. Use Edit tool with exact `old_string` matches — never use Write to overwrite CHANGELOG.md.
+
+**If CHANGELOG was not modified in this branch:** skip this step.
+
+**If CHANGELOG was modified in this branch**, review the entry for voice:
+
+- **Sell test:** Would a user reading each bullet think "oh nice, I want to try that"? If not,
+  rewrite the wording (not the content).
+- Lead with what the user can now **do** — not implementation details.
+- "You can now..." not "Refactored the..."
+- Flag and rewrite any entry that reads like a commit message.
+- Internal/contributor changes belong in a separate "### For contributors" subsection.
+- Auto-fix minor voice adjustments. Use AskUserQuestion if a rewrite would alter meaning.
+
+---
+
+## Step 6: Cross-Doc Consistency & Discoverability Check
+
+After auditing each file individually, do a cross-doc consistency pass:
+
+1. Does the README's feature/capability list match what CLAUDE.md (or project instructions) describes?
+2. Does ARCHITECTURE's component list match CONTRIBUTING's project structure description?
+3. Does CHANGELOG's latest version match the VERSION file?
+4. **Discoverability:** Is every documentation file reachable from README.md or CLAUDE.md? If
+   ARCHITECTURE.md exists but neither README nor CLAUDE.md links to it, flag it. Every doc
+   should be discoverable from one of the two entry-point files.
+5. Flag any contradictions between documents. Auto-fix clear factual inconsistencies (e.g., a
+   version mismatch). Use AskUserQuestion for narrative contradictions.
+
+---
+
+## Step 7: TODOS.md Cleanup
+
+This is a second pass that complements `/ship`'s Step 5.5. Read `review/TODOS-format.md` (if
+available) for the canonical TODO item format.
+
+If TODOS.md does not exist, skip this step.
+
+1. **Completed items not yet marked:** Cross-reference the diff against open TODO items. If a
+   TODO is clearly completed by the changes in this branch, move it to the Completed section
+   with `**Completed:** vX.Y.Z.W (YYYY-MM-DD)`. Be conservative — only mark items with clear
+   evidence in the diff.
+
+2. **Items needing description updates:** If a TODO references files or components that were
+   significantly changed, its description may be stale. Use AskUserQuestion to confirm whether
+   the TODO should be updated, completed, or left as-is.
+
+3. **New deferred work:** Check the diff for `TODO`, `FIXME`, `HACK`, and `XXX` comments. For
+   each one that represents meaningful deferred work (not a trivial inline note), use
+   AskUserQuestion to ask whether it should be captured in TODOS.md.
+
+---
+
+## Step 8: VERSION Bump Question
+
+**CRITICAL — NEVER BUMP VERSION WITHOUT ASKING.**
+
+1. **If VERSION does not exist:** Skip silently.
+
+2. Check if VERSION was already modified on this branch:
+
+```bash
+git diff <base>...HEAD -- VERSION
+```
+
+3. **If VERSION was NOT bumped:** Use AskUserQuestion:
+   - RECOMMENDATION: Choose C (Skip) because docs-only changes rarely warrant a version bump
+   - A) Bump PATCH (X.Y.Z+1) — if doc changes ship alongside code changes
+   - B) Bump MINOR (X.Y+1.0) — if this is a significant standalone release
+   - C) Skip — no version bump needed
+
+4. **If VERSION was already bumped:** Do NOT skip silently. Instead, check whether the bump
+   still covers the full scope of changes on this branch:
+
+   a. Read the CHANGELOG entry for the current VERSION. What features does it describe?
+   b. Read the full diff (`git diff <base>...HEAD --stat` and `git diff <base>...HEAD --name-only`).
+      Are there significant changes (new features, new skills, new commands, major refactors)
+      that are NOT mentioned in the CHANGELOG entry for the current version?
+   c. **If the CHANGELOG entry covers everything:** Skip — output "VERSION: Already bumped to
+      vX.Y.Z, covers all changes."
+   d. **If there are significant uncovered changes:** Use AskUserQuestion explaining what the
+      current version covers vs what's new, and ask:
+      - RECOMMENDATION: Choose A because the new changes warrant their own version
+      - A) Bump to next patch (X.Y.Z+1) — give the new changes their own version
+      - B) Keep current version — add new changes to the existing CHANGELOG entry
+      - C) Skip — leave version as-is, handle later
+
+   The key insight: a VERSION bump set for "feature A" should not silently absorb "feature B"
+   if feature B is substantial enough to deserve its own version entry.
+
+---
+
+## Step 9: Commit & Output
+
+**Empty check first:** Run `git status` (never use `-uall`). If no documentation files were
+modified by any previous step, output "All documentation is up to date." and exit without
+committing.
+
+**Commit:**
+
+1. Stage modified documentation files by name (never `git add -A` or `git add .`).
+2. Create a single commit:
+
+```bash
+git commit -m "$(cat <<'EOF'
+docs: update project documentation for vX.Y.Z.W
+
+Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
+EOF
+)"
+```
+
+3. Push to the current branch:
+
+```bash
+git push
+```
+
+**PR body update (idempotent, race-safe):**
+
+1. Read the existing PR body into a PID-unique tempfile:
+
+```bash
+gh pr view --json body -q .body > /tmp/gstack-pr-body-$$.md
+```
+
+2. If the tempfile already contains a `## Documentation` section, replace that section with the
+   updated content. If it does not contain one, append a `## Documentation` section at the end.
+
+3. The Documentation section should include a **doc diff preview** — for each file modified,
+   describe what specifically changed (e.g., "README.md: added /document-release to skills
+   table, updated skill count from 9 to 10").
+
+4. Write the updated body back:
+
+```bash
+gh pr edit --body-file /tmp/gstack-pr-body-$$.md
+```
+
+5. Clean up the tempfile:
+
+```bash
+rm -f /tmp/gstack-pr-body-$$.md
+```
+
+6. If `gh pr view` in step 1 fails (no PR exists): skip steps 2–5 with message "No PR found — skipping body update."
+7. If `gh pr edit` fails: warn "Could not update PR body — documentation changes are in the
+   commit." and continue.
+
+**Structured doc health summary (final output):**
+
+Output a scannable summary showing every documentation file's status:
+
+```
+Documentation health:
+  README.md       [status] ([details])
+  ARCHITECTURE.md [status] ([details])
+  CONTRIBUTING.md [status] ([details])
+  CHANGELOG.md    [status] ([details])
+  TODOS.md        [status] ([details])
+  VERSION         [status] ([details])
+```
+
+Where status is one of:
+- Updated — with description of what changed
+- Current — no changes needed
+- Voice polished — wording adjusted
+- Not bumped — user chose to skip
+- Already bumped — version was set by /ship
+- Skipped — file does not exist
+
+---
+
+## Important Rules
+
+- **Read before editing.** Always read the full content of a file before modifying it.
+- **Never clobber CHANGELOG.** Polish wording only. Never delete, replace, or regenerate entries.
+- **Never bump VERSION silently.** Always ask. Even if already bumped, check whether it covers the full scope of changes.
+- **Be explicit about what changed.** Every edit gets a one-line summary.
+- **Generic heuristics, not project-specific.** The audit checks work on any repo.
+- **Discoverability matters.** Every doc file should be reachable from README or CLAUDE.md.
+- **Voice: friendly, user-forward, not obscure.** Write like you're explaining to a smart person
+  who hasn't seen the code.
diff --git a/review/SKILL.md b/review/SKILL.md
index 285a4922..c111e57a 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -206,6 +206,20 @@ If TODOS.md doesn't exist, skip this step silently.
 
 ---
 
+## Step 5.6: Documentation staleness check
+
+Cross-reference the diff against documentation files. For each `.md` file in the repo root (README.md, ARCHITECTURE.md, CONTRIBUTING.md, CLAUDE.md, etc.):
+
+1. Check if code changes in the diff affect features, components, or workflows described in that doc file.
+2. If the doc file was NOT updated in this branch but the code it describes WAS changed, flag it as an INFORMATIONAL finding:
+   "Documentation may be stale: [file] describes [feature/component] but code changed in this branch. Consider running `/document-release`."
+
+This is informational only — never critical. The fix action is `/document-release`.
+
+If no documentation files exist, skip this step silently.
+
+---
+
 ## Important Rules
 
 - **Read the FULL diff before commenting.** Do not flag issues already addressed in the diff.
diff --git a/review/SKILL.md.tmpl b/review/SKILL.md.tmpl
index dadd211a..f13dae4f 100644
--- a/review/SKILL.md.tmpl
+++ b/review/SKILL.md.tmpl
@@ -124,6 +124,20 @@ If TODOS.md doesn't exist, skip this step silently.
 
 ---
 
+## Step 5.6: Documentation staleness check
+
+Cross-reference the diff against documentation files. For each `.md` file in the repo root (README.md, ARCHITECTURE.md, CONTRIBUTING.md, CLAUDE.md, etc.):
+
+1. Check if code changes in the diff affect features, components, or workflows described in that doc file.
+2. If the doc file was NOT updated in this branch but the code it describes WAS changed, flag it as an INFORMATIONAL finding:
+   "Documentation may be stale: [file] describes [feature/component] but code changed in this branch. Consider running `/document-release`."
+
+This is informational only — never critical. The fix action is `/document-release`.
+
+If no documentation files exist, skip this step silently.
+
+---
+
 ## Important Rules
 
 - **Read the FULL diff before commenting.** Do not flag issues already addressed in the diff.
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index 9d79189a..ebe4f54f 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -539,6 +539,7 @@ function findTemplates(): string[] {
     path.join(ROOT, 'plan-eng-review', 'SKILL.md.tmpl'),
     path.join(ROOT, 'retro', 'SKILL.md.tmpl'),
     path.join(ROOT, 'gstack-upgrade', 'SKILL.md.tmpl'),
+    path.join(ROOT, 'document-release', 'SKILL.md.tmpl'),
   ];
   for (const p of candidates) {
     if (fs.existsSync(p)) templates.push(p);
diff --git a/scripts/skill-check.ts b/scripts/skill-check.ts
index 591a0c81..51a583a2 100644
--- a/scripts/skill-check.ts
+++ b/scripts/skill-check.ts
@@ -27,6 +27,8 @@ const SKILL_FILES = [
   'plan-ceo-review/SKILL.md',
   'plan-eng-review/SKILL.md',
   'setup-browser-cookies/SKILL.md',
+  'gstack-upgrade/SKILL.md',
+  'document-release/SKILL.md',
 ].filter(f => fs.existsSync(path.join(ROOT, f)));
 
 let hasErrors = false;
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index aa50a976..37b42de8 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1546,6 +1546,110 @@ Write your retrospective to ${dir}/retro-output.md`,
   }, 300_000);
 });
 
+// --- Document-Release skill E2E ---
+
+describeE2E('Document-Release skill E2E', () => {
+  let docReleaseDir: string;
+
+  beforeAll(() => {
+    docReleaseDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-doc-release-'));
+
+    // Copy document-release skill files
+    copyDirSync(path.join(ROOT, 'document-release'), path.join(docReleaseDir, 'document-release'));
+
+    // Init git repo on an explicit "main" branch (the prompt names "main" as the base) with initial docs
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: docReleaseDir, stdio: 'pipe', timeout: 5000 });
+
+    run('git', ['init', '-b', 'main']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+
+    // Create initial README with a features list
+    fs.writeFileSync(path.join(docReleaseDir, 'README.md'),
+      '# Test Project\n\n## Features\n\n- Feature A\n- Feature B\n\n## Install\n\n```bash\nnpm install\n```\n');
+
+    // Create initial CHANGELOG that must NOT be clobbered
+    fs.writeFileSync(path.join(docReleaseDir, 'CHANGELOG.md'),
+      '# Changelog\n\n## 1.0.0 — 2026-03-01\n\n- Initial release with Feature A and Feature B\n- Setup CI pipeline\n');
+
+    // Create VERSION file (already bumped)
+    fs.writeFileSync(path.join(docReleaseDir, 'VERSION'), '1.1.0\n');
+
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'initial']);
+
+    // Create feature branch with a code change, a VERSION bump and a new CHANGELOG entry
+    run('git', ['checkout', '-b', 'feat/add-feature-c']);
+    fs.writeFileSync(path.join(docReleaseDir, 'feature-c.ts'), 'export function featureC() { return "C"; }\n');
+    fs.writeFileSync(path.join(docReleaseDir, 'VERSION'), '1.1.1\n');
+    fs.writeFileSync(path.join(docReleaseDir, 'CHANGELOG.md'),
+      '# Changelog\n\n## 1.1.1 — 2026-03-16\n\n- Added Feature C\n\n## 1.0.0 — 2026-03-01\n\n- Initial release with Feature A and Feature B\n- Setup CI pipeline\n');
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'feat: add feature C']);
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(docReleaseDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/document-release updates docs without clobbering CHANGELOG', async () => {
+    const result = await runSkillTest({
+      prompt: `Read the file document-release/SKILL.md for the document-release workflow instructions.
+
+Run the /document-release workflow on this repo. The base branch is "main".
+
+IMPORTANT:
+- Do NOT use AskUserQuestion — auto-approve everything or skip if unsure.
+- Do NOT push or create PRs (there is no remote).
+- Do NOT run gh commands (no remote).
+- Focus on updating README.md to reflect the new Feature C.
+- Do NOT overwrite or regenerate CHANGELOG entries.
+- Skip VERSION bump (it's already bumped).
+- After editing, just commit the changes locally.`,
+      workingDirectory: docReleaseDir,
+      maxTurns: 30,
+      allowedTools: ['Bash', 'Read', 'Write', 'Edit', 'Grep', 'Glob'],
+      timeout: 180_000,
+      testName: 'document-release',
+      runId,
+    });
+
+    logCost('/document-release', result);
+
+    // Read CHANGELOG and confirm the original 1.0.0 entry text survived the run
+    const changelog = fs.readFileSync(path.join(docReleaseDir, 'CHANGELOG.md'), 'utf-8');
+    const hasOriginalEntries = changelog.includes('Initial release with Feature A and Feature B')
+      && changelog.includes('Setup CI pipeline')
+      && changelog.includes('1.0.0');
+    if (!hasOriginalEntries) {
+      console.warn('CHANGELOG CLOBBERED — original entries missing!');
+    }
+
+    // Check if README mentions the new feature (logged below, not asserted)
+    const readme = fs.readFileSync(path.join(docReleaseDir, 'README.md'), 'utf-8');
+    const readmeUpdated = readme.includes('Feature C') || readme.includes('feature-c') || readme.includes('feature C');
+
+    const exitOk = ['success', 'error_max_turns'].includes(result.exitReason);
+    recordE2E('/document-release', 'Document-Release skill E2E', result, {
+      passed: exitOk && hasOriginalEntries,
+    });
+
+    // Critical guardrail: CHANGELOG must not be clobbered
+    expect(hasOriginalEntries).toBe(true);
+
+    // Accept error_max_turns — thorough doc review is not a failure
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+
+    // Informational: did it update README?
+    if (readmeUpdated) {
+      console.log('README updated to include Feature C');
+    } else {
+      console.warn('README was NOT updated — agent may not have found the feature');
+    }
+  }, 240_000);
+});
+
 // --- Deferred skill E2E tests (destructive or require interactive UI) ---
 
 describeE2E('Deferred skill E2E', () => {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 77f09ee0..a1817ede 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -176,6 +176,7 @@ describe('Update check preamble', () => {
     'ship/SKILL.md', 'review/SKILL.md',
     'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
     'retro/SKILL.md',
+    'document-release/SKILL.md',
   ];
 
   for (const skill of skillsWithUpdateCheck) {
@@ -397,6 +398,7 @@ describe('No hardcoded branch names in SKILL templates', () => {
     'qa/SKILL.md.tmpl',
     'plan-ceo-review/SKILL.md.tmpl',
     'retro/SKILL.md.tmpl',
+    'document-release/SKILL.md.tmpl',
   ];
 
   // Patterns that indicate hardcoded 'main' in git commands
@@ -479,6 +481,7 @@ describe('v0.4.1 preamble features', () => {
     'ship/SKILL.md', 'review/SKILL.md',
     'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
     'retro/SKILL.md',
+    'document-release/SKILL.md',
   ];
 
   for (const skill of skillsWithPreamble) {

From c86faa7968688993406fd4c6cd9550d58306408f Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 14:14:15 -0500
Subject: [PATCH 05/22] =?UTF-8?q?fix:=20update=20check=20cache=20=E2=80=94?=
 =?UTF-8?q?=2060min=20UP=5FTO=5FDATE=20TTL=20+=20--force=20flag=20(v0.4.4)?=
 =?UTF-8?q?=20(#110)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* fix: split update check cache TTL + add --force flag

UP_TO_DATE cache now expires after 60 min (was 720 min / 12 hours).
UPGRADE_AVAILABLE keeps 720 min TTL to keep nagging.

--force flag deletes cache before checking, used by /gstack-upgrade
standalone invocation to always get a fresh result from GitHub.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* feat: /gstack-upgrade standalone uses --force for fresh check

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: bump version and changelog (v0.4.4)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 CHANGELOG.md                            | 11 +++++
 VERSION                                 |  2 +-
 bin/gstack-update-check                 | 27 +++++++-----
 browse/test/gstack-update-check.test.ts | 58 +++++++++++++++++++++++--
 gstack-upgrade/SKILL.md                 | 11 ++++-
 gstack-upgrade/SKILL.md.tmpl            | 11 ++++-
 6 files changed, 104 insertions(+), 16 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 3c3fcceb..d61ba4f2 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,16 @@
 # Changelog
 
+## 0.4.4 — 2026-03-16
+
+- **New releases detected in under an hour, not half a day.** The update check cache was set to 12 hours, which meant you could be stuck on an old version all day while new releases dropped. Now "you're up to date" expires after 60 minutes, so you'll see upgrades within the hour. "Upgrade available" still nags for 12 hours (that's the point).
+- **`/gstack-upgrade` always checks for real.** Running `/gstack-upgrade` directly now bypasses the cache and does a fresh check against GitHub. No more "you're already on the latest" when you're not.
+
+### For contributors
+
+- Split `last-update-check` cache TTL: 60 min for `UP_TO_DATE`, 720 min for `UPGRADE_AVAILABLE`.
+- Added `--force` flag to `bin/gstack-update-check` (deletes cache file before checking).
+- 3 new tests: `--force` busts UP_TO_DATE cache, `--force` busts UPGRADE_AVAILABLE cache, 60-min TTL boundary test with `utimesSync`.
+
 ## 0.4.3 — 2026-03-16
 
 - **New `/document-release` skill.** Run it after `/ship` but before merging — it reads every doc file in your project, cross-references the diff, and updates README, ARCHITECTURE, CONTRIBUTING, CHANGELOG, and TODOS to match what you actually shipped. Risky changes get surfaced as questions; everything else is automatic.
diff --git a/VERSION b/VERSION
index 17b2ccd9..6f2743d6 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.4.3
+0.4.4
diff --git a/bin/gstack-update-check b/bin/gstack-update-check
index 7c5e5ca0..d44c7e0f 100755
--- a/bin/gstack-update-check
+++ b/bin/gstack-update-check
@@ -20,6 +20,11 @@ SNOOZE_FILE="$STATE_DIR/update-snoozed"
 VERSION_FILE="$GSTACK_DIR/VERSION"
 REMOTE_URL="${GSTACK_REMOTE_URL:-https://raw.githubusercontent.com/garrytan/gstack/main/VERSION}"
 
+# ─── Force flag: a leading --force deletes the cache file so the Step 3 cache lookup is skipped (standalone /gstack-upgrade) ──
+if [ "${1:-}" = "--force" ]; then
+  rm -f "$CACHE_FILE"
+fi
+
 # ─── Step 0: Check if updates are disabled ────────────────────
 _UC=$("$GSTACK_DIR/bin/gstack-config" get update_check 2>/dev/null || true)
 if [ "$_UC" = "false" ]; then
@@ -97,24 +102,27 @@ if [ -f "$MARKER_FILE" ]; then
   exit 0
 fi
 
-# ─── Step 3: Check cache freshness (12h = 720 min) ──────────
+# ─── Step 3: Check cache freshness ──────────────────────────
+# UP_TO_DATE: 60 min TTL (detect new releases quickly)
+# UPGRADE_AVAILABLE: 720 min TTL (keep nagging)
 if [ -f "$CACHE_FILE" ]; then
-  # Cache is fresh if modified within 720 minutes
-  STALE=$(find "$CACHE_FILE" -mmin +720 2>/dev/null || true)
-  if [ -z "$STALE" ]; then
-    # Cache is fresh — read it
-    CACHED="$(cat "$CACHE_FILE" 2>/dev/null || true)"
+  CACHED="$(cat "$CACHE_FILE" 2>/dev/null || true)"
+  case "$CACHED" in
+    UP_TO_DATE*)        CACHE_TTL=60 ;;
+    UPGRADE_AVAILABLE*) CACHE_TTL=720 ;;
+    *)                  CACHE_TTL=0 ;;  # corrupt → force re-fetch
+  esac
+
+  STALE=$(find "$CACHE_FILE" -mmin +$CACHE_TTL 2>/dev/null || true)
+  if [ -z "$STALE" ] && [ "$CACHE_TTL" -gt 0 ]; then
     case "$CACHED" in
       UP_TO_DATE*)
-        # Verify local version still matches cached version
         CACHED_VER="$(echo "$CACHED" | awk '{print $2}')"
         if [ "$CACHED_VER" = "$LOCAL" ]; then
           exit 0
         fi
-        # Local version changed — fall through to re-check
         ;;
       UPGRADE_AVAILABLE*)
-        # Verify local version still matches cached old version
         CACHED_OLD="$(echo "$CACHED" | awk '{print $2}')"
         if [ "$CACHED_OLD" = "$LOCAL" ]; then
           CACHED_NEW="$(echo "$CACHED" | awk '{print $3}')"
@@ -124,7 +132,6 @@ if [ -f "$CACHE_FILE" ]; then
           echo "$CACHED"
           exit 0
         fi
-        # Local version changed (manual upgrade?) — fall through to re-check
         ;;
     esac
   fi
diff --git a/browse/test/gstack-update-check.test.ts b/browse/test/gstack-update-check.test.ts
index 2ec70e2d..66239931 100644
--- a/browse/test/gstack-update-check.test.ts
+++ b/browse/test/gstack-update-check.test.ts
@@ -7,7 +7,7 @@
  */
 
 import { describe, test, expect, beforeEach, afterEach } from 'bun:test';
-import { mkdtempSync, writeFileSync, rmSync, existsSync, readFileSync, mkdirSync, symlinkSync } from 'fs';
+import { mkdtempSync, writeFileSync, rmSync, existsSync, readFileSync, mkdirSync, symlinkSync, utimesSync } from 'fs';
 import { join } from 'path';
 import { tmpdir } from 'os';
 
@@ -16,8 +16,8 @@ const SCRIPT = join(import.meta.dir, '..', '..', 'bin', 'gstack-update-check');
 let gstackDir: string;
 let stateDir: string;
 
-function run(extraEnv: Record<string, string> = {}) {
-  const result = Bun.spawnSync(['bash', SCRIPT], {
+function run(extraEnv: Record<string, string> = {}, args: string[] = []) {
+  const result = Bun.spawnSync(['bash', SCRIPT, ...args], {
     env: {
       ...process.env,
       GSTACK_DIR: gstackDir,
@@ -412,4 +412,56 @@ describe('gstack-update-check', () => {
     expect(exitCode).toBe(0);
     expect(stdout).toBe('UPGRADE_AVAILABLE 0.3.3 0.4.0');
   });
+
+  // ─── --force flag tests ──────────────────────────────────────
+
+  test('--force busts fresh UP_TO_DATE cache', () => {
+    writeFileSync(join(gstackDir, 'VERSION'), '0.3.3\n');
+    writeFileSync(join(gstackDir, 'REMOTE_VERSION'), '0.4.0\n');
+    writeFileSync(join(stateDir, 'last-update-check'), 'UP_TO_DATE 0.3.3');
+
+    // Baseline run: the fresh cache answers, so nothing is printed
+    const { stdout: cachedOut } = run();
+    expect(cachedOut).toBe('');
+
+    // Forced run: the cache is discarded and the newer remote version is reported
+    const { exitCode, stdout } = run({}, ['--force']);
+    expect(exitCode).toBe(0);
+    expect(stdout).toBe('UPGRADE_AVAILABLE 0.3.3 0.4.0');
+  });
+
+  test('--force busts fresh UPGRADE_AVAILABLE cache', () => {
+    const cachePath = join(stateDir, 'last-update-check');
+    writeFileSync(join(gstackDir, 'VERSION'), '0.3.3\n');
+    writeFileSync(join(gstackDir, 'REMOTE_VERSION'), '0.3.3\n');
+    writeFileSync(cachePath, 'UPGRADE_AVAILABLE 0.3.3 0.4.0');
+
+    // Baseline run: the fresh cache still reports the outdated upgrade notice
+    const { stdout: cachedOut } = run();
+    expect(cachedOut).toBe('UPGRADE_AVAILABLE 0.3.3 0.4.0');
+
+    // Forced run: the cache is discarded, versions match, and the cache is rewritten
+    const { exitCode, stdout } = run({}, ['--force']);
+    expect(exitCode).toBe(0);
+    expect(stdout).toBe('');
+    expect(readFileSync(cachePath, 'utf-8')).toContain('UP_TO_DATE');
+  });
+
+  // ─── Split TTL tests ─────────────────────────────────────────
+
+  test('UP_TO_DATE cache expires after 60 min (not 720)', () => {
+    const cachePath = join(stateDir, 'last-update-check');
+    writeFileSync(join(gstackDir, 'VERSION'), '0.3.3\n');
+    writeFileSync(join(gstackDir, 'REMOTE_VERSION'), '0.4.0\n');
+    writeFileSync(cachePath, 'UP_TO_DATE 0.3.3');
+
+    // Backdate the cache file by 90 minutes: older than the 60-min TTL, younger than 720
+    const backdated = new Date(Date.now() - 90 * 60 * 1000);
+    utimesSync(cachePath, backdated, backdated);
+
+    // An expired UP_TO_DATE entry must be ignored, so the run reports the upgrade
+    const result = run();
+    expect(result.exitCode).toBe(0);
+    expect(result.stdout).toBe('UPGRADE_AVAILABLE 0.3.3 0.4.0');
+  });
 });
diff --git a/gstack-upgrade/SKILL.md b/gstack-upgrade/SKILL.md
index 42f13f69..9d635651 100644
--- a/gstack-upgrade/SKILL.md
+++ b/gstack-upgrade/SKILL.md
@@ -189,4 +189,13 @@ After showing What's New, continue with whatever skill the user originally invok
 
 ## Standalone usage
 
-When invoked directly as `/gstack-upgrade` (not from a preamble), follow Steps 2-6 above. If already on the latest version, tell the user: "You're already on the latest version (v{version})."
+When invoked directly as `/gstack-upgrade` (not from a preamble):
+
+1. Force a fresh update check (bypass cache):
+```bash
+~/.claude/skills/gstack/bin/gstack-update-check --force
+```
+Use the output to determine if an upgrade is available.
+
+2. If `UPGRADE_AVAILABLE <old> <new>`: follow Steps 2-6 above.
+3. If no output (up to date): tell the user "You're already on the latest version (v{version})."
diff --git a/gstack-upgrade/SKILL.md.tmpl b/gstack-upgrade/SKILL.md.tmpl
index a199db6c..a441b8d6 100644
--- a/gstack-upgrade/SKILL.md.tmpl
+++ b/gstack-upgrade/SKILL.md.tmpl
@@ -187,4 +187,13 @@ After showing What's New, continue with whatever skill the user originally invok
 
 ## Standalone usage
 
-When invoked directly as `/gstack-upgrade` (not from a preamble), follow Steps 2-6 above. If already on the latest version, tell the user: "You're already on the latest version (v{version})."
+When invoked directly as `/gstack-upgrade` (not from a preamble):
+
+1. Force a fresh update check (bypass cache):
+```bash
+~/.claude/skills/gstack/bin/gstack-update-check --force
+```
+Use the output to determine if an upgrade is available.
+
+2. If `UPGRADE_AVAILABLE <old> <new>`: follow Steps 2-6 above.
+3. If no output (up to date): tell the user "You're already on the latest version (v{version})."

From 318ffdbdf01e9c6ad78ab41852803d955e9dc092 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 21:50:43 -0500
Subject: [PATCH 06/22] fix: js statement wrapping + click auto-routes option
 to selectOption (v0.4.5) (#117)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* fix: js statement wrapping + click auto-routes option to selectOption

Bug 1: js command wrapped all code as expressions — const, semicolons,
and multi-line code broke with SyntaxError. Added needsBlockWrapper()
and wrapForEvaluate() helpers (shared with eval) to detect statements
and use block wrapper {…} instead of expression wrapper (…).

Bug 2: clicking <option> refs hung forever because Playwright can't
.click() native select UI. Click handler now checks ARIA role + DOM
tagName and auto-routes to selectOption() via parent <select>.

Bug 3: click timeouts on <option> elements gave no guidance. Now
throws helpful error: "Use browse select instead of click."

* chore: bump version and changelog (v0.4.5)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                  | 15 +++++++++++
 VERSION                       |  2 +-
 browse/src/browser-manager.ts |  9 +++++++
 browse/src/read-commands.ts   | 30 ++++++++++++++-------
 browse/src/write-commands.ts  | 45 ++++++++++++++++++++++++++++---
 browse/test/commands.test.ts  | 51 +++++++++++++++++++++++++++++++++++
 6 files changed, 138 insertions(+), 14 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index d61ba4f2..530f0e75 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,20 @@
 # Changelog
 
+## 0.4.5 — 2026-03-16
+
+### Fixed
+
+- **`$B js "const x = await fetch(...); return x.status"` now works.** The `js` command used to wrap everything as an expression — so `const`, semicolons, and multi-line code all broke. It now detects statements and uses a block wrapper, just like `eval` already did.
+- **Clicking a dropdown option no longer hangs forever.** If an agent sees `@e3 [option] "Admin"` in a snapshot and runs `click @e3`, gstack now auto-selects that option instead of hanging on an impossible Playwright click. The right thing just happens.
+- **When click is the wrong tool, gstack tells you.** Clicking an `<option>` via CSS selector used to time out with a cryptic Playwright error. Now you get: `"Use 'browse select' instead of 'click' for dropdown options."`
+
+### For contributors
+
+- Extracted `needsBlockWrapper()` and `wrapForEvaluate()` helpers in `read-commands.ts` — shared by both `js` and `eval` commands (DRY).
+- Added `getRefRole()` to `BrowserManager` — exposes ARIA role for ref selectors without changing `resolveRef` return type.
+- Click handler auto-routes `[role=option]` refs to `selectOption()` via parent `<select>`, with DOM `tagName` check to avoid blocking custom listbox components.
+- 6 new tests: multi-line js, semicolons, statement keywords, simple expressions, option auto-routing, CSS option error guidance.
+
 ## 0.4.4 — 2026-03-16
 
 - **New releases detected in under an hour, not half a day.** The update check cache was set to 12 hours, which meant you could be stuck on an old version all day while new releases dropped. Now "you're up to date" expires after 60 minutes, so you'll see upgrades within the hour. "Upgrade available" still nags for 12 hours (that's the point).
diff --git a/VERSION b/VERSION
index 6f2743d6..0bfccb08 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.4.4
+0.4.5
diff --git a/browse/src/browser-manager.ts b/browse/src/browser-manager.ts
index 243ed177..260c8219 100644
--- a/browse/src/browser-manager.ts
+++ b/browse/src/browser-manager.ts
@@ -208,6 +208,15 @@ export class BrowserManager {
     return { selector };
   }
 
+  /** Look up the ARIA role stored for a ref selector (`@e…` / `@c…`); CSS selectors and unknown refs yield null. */
+  getRefRole(selector: string): string | null {
+    const isRef = selector.startsWith('@e') || selector.startsWith('@c');
+    if (!isRef) return null;
+    // refMap is keyed without the leading '@'
+    const role = this.refMap.get(selector.slice(1))?.role;
+    return role ?? null;
+  }
+
   getRefCount(): number {
     return this.refMap.size;
   }
diff --git a/browse/src/read-commands.ts b/browse/src/read-commands.ts
index a7d76352..54877562 100644
--- a/browse/src/read-commands.ts
+++ b/browse/src/read-commands.ts
@@ -17,6 +17,24 @@ function hasAwait(code: string): boolean {
   return /\bawait\b/.test(stripped);
 }
 
+/** Detect whether code needs a block wrapper {…} vs expression wrapper (…) inside an async IIFE. String literals are ignored so a `;` or keyword inside quotes does not force a block (which would drop the expression's value). */
+function needsBlockWrapper(code: string): boolean {
+  const trimmed = code.trim();
+  if (trimmed.split('\n').length > 1) return true;
+  const bare = trimmed.replace(/(["'`])(?:\\.|(?!\1)[^\\])*\1/g, '""'); // blank out quoted string contents
+  if (/\b(const|let|var|function|class|return|throw|if|for|while|switch|try)\b/.test(bare)) return true;
+  return bare.includes(';');
+}
+
+/** Wrap code for page.evaluate(): await-free code passes through; otherwise it runs in an async IIFE with a block or expression body. */
+function wrapForEvaluate(code: string): string {
+  if (!hasAwait(code)) return code;
+  const expr = code.trim();
+  // Block bodies embed the caller's original text; expression bodies embed the trimmed form.
+  if (needsBlockWrapper(expr)) return `(async()=>{\n${code}\n})()`;
+  return `(async()=>(${expr}))()`;
+}
+
 // Security: Path validation to prevent path traversal attacks
 const SAFE_DIRECTORIES = ['/tmp', process.cwd()];
 
@@ -124,7 +142,7 @@ export async function handleReadCommand(
     case 'js': {
       const expr = args[0];
       if (!expr) throw new Error('Usage: browse js <expression>');
-      const wrapped = hasAwait(expr) ? `(async()=>(${expr}))()` : expr;
+      const wrapped = wrapForEvaluate(expr);
       const result = await page.evaluate(wrapped);
       return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
     }
@@ -135,14 +153,8 @@ export async function handleReadCommand(
       validateReadPath(filePath);
       if (!fs.existsSync(filePath)) throw new Error(`File not found: ${filePath}`);
       const code = fs.readFileSync(filePath, 'utf-8');
-      if (hasAwait(code)) {
-        const trimmed = code.trim();
-        const isSingleExpr = trimmed.split('\n').length === 1;
-        const wrapped = isSingleExpr ? `(async()=>(${trimmed}))()` : `(async()=>{\n${code}\n})()`;
-        const result = await page.evaluate(wrapped);
-        return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
-      }
-      const result = await page.evaluate(code);
+      const wrapped = wrapForEvaluate(code);
+      const result = await page.evaluate(wrapped);
       return typeof result === 'object' ? JSON.stringify(result, null, 2) : String(result ?? '');
     }
 
diff --git a/browse/src/write-commands.ts b/browse/src/write-commands.ts
index 87b2fa5d..2b384920 100644
--- a/browse/src/write-commands.ts
+++ b/browse/src/write-commands.ts
@@ -44,11 +44,48 @@ export async function handleWriteCommand(
     case 'click': {
       const selector = args[0];
       if (!selector) throw new Error('Usage: browse click <selector>');
+
+      // Auto-route: if ref points to a real <option> inside a <select>, use selectOption
+      const role = bm.getRefRole(selector);
+      if (role === 'option') {
+        const resolved = await bm.resolveRef(selector);
+        if ('locator' in resolved) {
+          const optionInfo = await resolved.locator.evaluate(el => {
+            if (el.tagName !== 'OPTION') return null; // custom [role=option], not real <option>
+            const option = el as HTMLOptionElement;
+            const select = option.closest('select');
+            if (!select) return null;
+            return { value: option.value, text: option.text };
+          });
+          if (optionInfo) {
+            await resolved.locator.locator('xpath=ancestor::select').selectOption(optionInfo.value, { timeout: 5000 });
+            return `Selected "${optionInfo.text}" (auto-routed from click on <option>) → now at ${page.url()}`;
+          }
+          // Real <option> with no parent <select> or custom [role=option] — fall through to normal click
+        }
+      }
+
       const resolved = await bm.resolveRef(selector);
-      if ('locator' in resolved) {
-        await resolved.locator.click({ timeout: 5000 });
-      } else {
-        await page.click(resolved.selector, { timeout: 5000 });
+      try {
+        if ('locator' in resolved) {
+          await resolved.locator.click({ timeout: 5000 });
+        } else {
+          await page.click(resolved.selector, { timeout: 5000 });
+        }
+      } catch (err: any) {
+        // Enhanced error guidance: clicking <option> elements always fails (not visible / timeout)
+        const isOption = 'locator' in resolved
+          ? await resolved.locator.evaluate(el => el.tagName === 'OPTION').catch(() => false)
+          : await page.evaluate(
+              (sel: string) => document.querySelector(sel)?.tagName === 'OPTION',
+              (resolved as { selector: string }).selector
+            ).catch(() => false);
+        if (isOption) {
+          throw new Error(
+            `Cannot click <option> elements. Use 'browse select <parent-select> <value>' instead of 'click' for dropdown options.`
+          );
+        }
+        throw err;
       }
       // Wait briefly for any navigation/DOM update
       await page.waitForLoadState('domcontentloaded').catch(() => {});
diff --git a/browse/test/commands.test.ts b/browse/test/commands.test.ts
index d8aaeab6..ea68dff6 100644
--- a/browse/test/commands.test.ts
+++ b/browse/test/commands.test.ts
@@ -198,6 +198,27 @@ describe('Inspection', () => {
     }
   });
 
+  test('js handles multi-line with await', async () => {
+    const script = ['const x = await Promise.resolve(42);', 'return x;'].join('\n');
+    const output = await handleReadCommand('js', [script], bm);
+    expect(output).toBe('42');
+  });
+
+  test('js handles await with semicolons', async () => {
+    const script = 'const x = await Promise.resolve(5); return x + 1;';
+    expect(await handleReadCommand('js', [script], bm)).toBe('6');
+  });
+
+  test('js handles await with statement keywords', async () => {
+    const script = 'const res = await Promise.resolve("ok"); return res;';
+    expect(await handleReadCommand('js', [script], bm)).toBe('ok');
+  });
+
+  test('js still works for simple expressions', async () => {
+    const output = await handleReadCommand('js', ['1 + 2'], bm);
+    expect(output).toBe('3');
+  });
+
   test('css returns computed property', async () => {
     const result = await handleReadCommand('css', ['h1', 'color'], bm);
     // Navy color
@@ -247,6 +268,36 @@ describe('Interaction', () => {
     expect(val).toBe('admin');
   });
 
+  test('click on option ref auto-routes to selectOption', async () => {
+    await handleWriteCommand('goto', [baseUrl + '/forms.html'], bm);
+    // Reset select to default so the final value check proves the click changed it
+    await handleReadCommand('js', ['document.querySelector("#role").value = ""'], bm);
+    const snap = await handleMetaCommand('snapshot', [], bm, async () => {});
+    // Find the snapshot line for an option ref (e.g., "Admin" option)
+    const optionLine = snap.split('\n').find((l: string) => l.includes('[option]') && l.includes('"Admin"'));
+    expect(optionLine).toBeDefined();
+    const refMatch = optionLine!.match(/@(e\d+)/);
+    expect(refMatch).not.toBeNull(); // match() yields null on a miss, which toBeDefined() would accept
+    const ref = `@${refMatch![1]}`;
+    const result = await handleWriteCommand('click', [ref], bm);
+    expect(result).toContain('auto-routed');
+    expect(result).toContain('Selected');
+    // Verify the select value actually changed
+    const val = await handleReadCommand('js', ['document.querySelector("#role").value'], bm);
+    expect(val).toBe('admin');
+  });
+
+  test('click CSS selector on option gives helpful error', async () => {
+    await handleWriteCommand('goto', [baseUrl + '/forms.html'], bm);
+    // Clicking an <option> via CSS selector must reject with guidance that
+    // mentions both "select" and "option". Assert on the rejection directly:
+    // a sentinel expect() inside try/catch would itself be caught and then
+    // surface as a confusing message mismatch.
+    const click = handleWriteCommand('click', ['option[value="admin"]'], bm);
+    await expect(click).rejects.toThrow('select');
+    await expect(click).rejects.toThrow('option');
+  }, 15000);
+
   test('hover works', async () => {
     const result = await handleWriteCommand('hover', ['h1'], bm);
     expect(result).toContain('Hovered');

From a30f7079da13904d32a50b73f1ff04c1ed75ca7c Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 21:52:50 -0500
Subject: [PATCH 07/22] =?UTF-8?q?feat:=20Fix-First=20Review=20=E2=80=94=20?=
 =?UTF-8?q?auto-fix=20obvious=20issues,=20ask=20about=20hard=20ones=20(v0.?=
 =?UTF-8?q?4.5)=20(#116)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: Fix-First Review — auto-fix obvious issues, ask about hard ones

Replace the CRITICAL-only AskUserQuestion flow with Fix-First:
- Every finding gets action (not just critical ones)
- AUTO-FIX items (dead code, N+1, stale comments) applied directly
- ASK items (security, race conditions, design decisions) batched
  into at most one AskUserQuestion
- Fix-First Heuristic in checklist.md (single source of truth)
- Gate Classification → Severity Classification rename

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: bump version and changelog (v0.4.5)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: polish CHANGELOG v0.4.5 voice — lead with user benefit

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 CHANGELOG.md                  |  6 ++++
 review/SKILL.md               | 55 ++++++++++++++++++++++++++++++-----
 review/SKILL.md.tmpl          | 55 ++++++++++++++++++++++++++++++-----
 review/checklist.md           | 51 ++++++++++++++++++++++++++------
 ship/SKILL.md                 | 29 +++++++++++-------
 ship/SKILL.md.tmpl            | 29 +++++++++++-------
 test/skill-validation.test.ts | 17 +++++++++--
 7 files changed, 193 insertions(+), 49 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 530f0e75..0321b24c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,9 @@
 
 ## 0.4.5 — 2026-03-16
 
+- **Review findings now actually get fixed, not just listed.** `/review` and `/ship` used to print informational findings (dead code, test gaps, N+1 queries) and then ignore them. Now every finding gets action: obvious mechanical fixes are applied automatically, and genuinely ambiguous issues are batched into a single question instead of 8 separate prompts. You see `[AUTO-FIXED] file:line Problem → what was done` for each auto-fix.
+- **You control the line between "just fix it" and "ask me first."** Dead code, stale comments, N+1 queries get auto-fixed. Security issues, race conditions, design decisions get surfaced for your call. The classification lives in one place (`review/checklist.md`) so both `/review` and `/ship` stay in sync.
+
 ### Fixed
 
 - **`$B js "const x = await fetch(...); return x.status"` now works.** The `js` command used to wrap everything as an expression — so `const`, semicolons, and multi-line code all broke. It now detects statements and uses a block wrapper, just like `eval` already did.
@@ -10,6 +13,9 @@
 
 ### For contributors
 
+- Gate Classification → Severity Classification rename (severity determines presentation order, not whether you see a prompt).
+- Fix-First Heuristic section added to `review/checklist.md` — the canonical AUTO-FIX vs ASK classification.
+- New validation test: `Fix-First Heuristic exists in checklist and is referenced by review + ship`.
 - Extracted `needsBlockWrapper()` and `wrapForEvaluate()` helpers in `read-commands.ts` — shared by both `js` and `eval` commands (DRY).
 - Added `getRefRole()` to `BrowserManager` — exposes ARIA role for ref selectors without changing `resolveRef` return type.
 - Click handler auto-routes `[role=option]` refs to `selectOption()` via parent `<select>`, with DOM `tagName` check to avoid blocking custom listbox components.
diff --git a/review/SKILL.md b/review/SKILL.md
index c111e57a..3ad683d6 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -157,14 +157,53 @@ Follow the output format specified in the checklist. Respect the suppressions 
 
 ---
 
-## Step 5: Output findings
+## Step 5: Fix-First Review
 
-**Always output ALL findings** — both critical and informational. The user must see every issue.
+**Every finding gets action — not just critical ones.**
 
-- If CRITICAL issues found: output all findings, then for EACH critical issue use a separate AskUserQuestion with the problem, then `RECOMMENDATION: Choose A because [one-line reason]`, then options (A: Fix it now, B: Acknowledge, C: False positive — skip).
-  After all critical questions are answered, output a summary of what the user chose for each issue. If the user chose A (fix) on any issue, apply the recommended fixes. If only B/C were chosen, no action needed.
-- If only non-critical issues found: output findings. No further action needed.
-- If no issues found: output `Pre-Landing Review: No issues found.`
+Output a summary header: `Pre-Landing Review: N issues (X critical, Y informational)`
+
+### Step 5a: Classify each finding
+
+For each finding, classify as AUTO-FIX or ASK per the Fix-First Heuristic in
+checklist.md. Critical findings lean toward ASK; informational findings lean
+toward AUTO-FIX.
+
+### Step 5b: Auto-fix all AUTO-FIX items
+
+Apply each fix directly. For each one, output a one-line summary:
+`[AUTO-FIXED] [file:line] Problem → what you did`
+
+### Step 5c: Batch-ask about ASK items
+
+If there are ASK items remaining, present them in ONE AskUserQuestion:
+
+- List each item with a number, the severity label, the problem, and a recommended fix
+- For each item, provide options: A) Fix as recommended, B) Skip
+- Include an overall RECOMMENDATION
+
+Example format:
+```
+I auto-fixed 5 issues. 2 need your input:
+
+1. [CRITICAL] app/models/post.rb:42 — Race condition in status transition
+   Fix: Add `WHERE status = 'draft'` to the UPDATE
+   → A) Fix  B) Skip
+
+2. [INFORMATIONAL] app/services/generator.rb:88 — LLM output not type-checked before DB write
+   Fix: Add JSON schema validation
+   → A) Fix  B) Skip
+
+RECOMMENDATION: Fix both — #1 is a real race condition, #2 prevents silent data corruption.
+```
+
+If 3 or fewer ASK items, you may use individual AskUserQuestion calls instead of batching.
+
+### Step 5d: Apply user-approved fixes
+
+Apply fixes for items where the user chose "Fix." Output what was fixed.
+
+If no ASK items exist (everything was AUTO-FIX), skip the question entirely.
 
 ### Greptile comment resolution
 
@@ -174,7 +213,7 @@ After outputting your own findings, if Greptile comments were classified in Step
 
 Before replying to any comment, run the **Escalation Detection** algorithm from greptile-triage.md to determine whether to use Tier 1 (friendly) or Tier 2 (firm) reply templates.
 
-1. **VALID & ACTIONABLE comments:** These are already included in your CRITICAL findings — they follow the same AskUserQuestion flow (A: Fix it now, B: Acknowledge, C: False positive). If the user chooses A (fix), reply using the **Fix reply template** from greptile-triage.md (include inline diff + explanation). If the user chooses C (false positive), reply using the **False Positive reply template** (include evidence + suggested re-rank), save to both per-project and global greptile-history.
+1. **VALID & ACTIONABLE comments:** These are included in your findings — they follow the Fix-First flow (auto-fixed if mechanical, batched into ASK if not). When one of these is an ASK item, offer the options A: Fix it now, B: Acknowledge, C: False positive. If the comment is auto-fixed or the user chooses A (fix), reply using the **Fix reply template** from greptile-triage.md (include inline diff + explanation). If the user chooses C (false positive), reply using the **False Positive reply template** (include evidence + suggested re-rank), save to both per-project and global greptile-history.
 
 2. **FALSE POSITIVE comments:** Present each one via AskUserQuestion:
    - Show the Greptile comment: file:line (or [top-level]) + body summary + permalink URL
@@ -223,7 +262,7 @@ If no documentation files exist, skip this step silently.
 ## Important Rules
 
 - **Read the FULL diff before commenting.** Do not flag issues already addressed in the diff.
-- **Read-only by default.** Only modify files if the user explicitly chooses "Fix it now" on a critical issue. Never commit, push, or create PRs.
+- **Fix-first, not read-only.** AUTO-FIX items are applied directly. ASK items are only applied after user approval. Never commit, push, or create PRs — that's /ship's job.
 - **Be terse.** One line problem, one line fix. No preamble.
 - **Only flag real problems.** Skip anything that's fine.
 - **Use Greptile reply templates from greptile-triage.md.** Every reply includes evidence. Never post vague replies.
diff --git a/review/SKILL.md.tmpl b/review/SKILL.md.tmpl
index f13dae4f..c122ada1 100644
--- a/review/SKILL.md.tmpl
+++ b/review/SKILL.md.tmpl
@@ -75,14 +75,53 @@ Follow the output format specified in the checklist. Respect the suppressions 
 
 ---
 
-## Step 5: Output findings
+## Step 5: Fix-First Review
 
-**Always output ALL findings** — both critical and informational. The user must see every issue.
+**Every finding gets action — not just critical ones.**
 
-- If CRITICAL issues found: output all findings, then for EACH critical issue use a separate AskUserQuestion with the problem, then `RECOMMENDATION: Choose A because [one-line reason]`, then options (A: Fix it now, B: Acknowledge, C: False positive — skip).
-  After all critical questions are answered, output a summary of what the user chose for each issue. If the user chose A (fix) on any issue, apply the recommended fixes. If only B/C were chosen, no action needed.
-- If only non-critical issues found: output findings. No further action needed.
-- If no issues found: output `Pre-Landing Review: No issues found.`
+Output a summary header: `Pre-Landing Review: N issues (X critical, Y informational)`
+
+### Step 5a: Classify each finding
+
+For each finding, classify as AUTO-FIX or ASK per the Fix-First Heuristic in
+checklist.md. Critical findings lean toward ASK; informational findings lean
+toward AUTO-FIX.
+
+### Step 5b: Auto-fix all AUTO-FIX items
+
+Apply each fix directly. For each one, output a one-line summary:
+`[AUTO-FIXED] [file:line] Problem → what you did`
+
+### Step 5c: Batch-ask about ASK items
+
+If there are ASK items remaining, present them in ONE AskUserQuestion:
+
+- List each item with a number, the severity label, the problem, and a recommended fix
+- For each item, provide options: A) Fix as recommended, B) Skip
+- Include an overall RECOMMENDATION
+
+Example format:
+```
+I auto-fixed 5 issues. 2 need your input:
+
+1. [CRITICAL] app/models/post.rb:42 — Race condition in status transition
+   Fix: Add `WHERE status = 'draft'` to the UPDATE
+   → A) Fix  B) Skip
+
+2. [INFORMATIONAL] app/services/generator.rb:88 — LLM output not type-checked before DB write
+   Fix: Add JSON schema validation
+   → A) Fix  B) Skip
+
+RECOMMENDATION: Fix both — #1 is a real race condition, #2 prevents silent data corruption.
+```
+
+If 3 or fewer ASK items, you may use individual AskUserQuestion calls instead of batching.
+
+### Step 5d: Apply user-approved fixes
+
+Apply fixes for items where the user chose "Fix." Output what was fixed.
+
+If no ASK items exist (everything was AUTO-FIX), skip the question entirely.
 
 ### Greptile comment resolution
 
@@ -92,7 +131,7 @@ After outputting your own findings, if Greptile comments were classified in Step
 
 Before replying to any comment, run the **Escalation Detection** algorithm from greptile-triage.md to determine whether to use Tier 1 (friendly) or Tier 2 (firm) reply templates.
 
-1. **VALID & ACTIONABLE comments:** These are already included in your CRITICAL findings — they follow the same AskUserQuestion flow (A: Fix it now, B: Acknowledge, C: False positive). If the user chooses A (fix), reply using the **Fix reply template** from greptile-triage.md (include inline diff + explanation). If the user chooses C (false positive), reply using the **False Positive reply template** (include evidence + suggested re-rank), save to both per-project and global greptile-history.
+1. **VALID & ACTIONABLE comments:** These are included in your findings — they follow the Fix-First flow (auto-fixed if mechanical, batched into ASK if not). When one of these is an ASK item, offer the options A: Fix it now, B: Acknowledge, C: False positive. If the comment is auto-fixed or the user chooses A (fix), reply using the **Fix reply template** from greptile-triage.md (include inline diff + explanation). If the user chooses C (false positive), reply using the **False Positive reply template** (include evidence + suggested re-rank), save to both per-project and global greptile-history.
 
 2. **FALSE POSITIVE comments:** Present each one via AskUserQuestion:
    - Show the Greptile comment: file:line (or [top-level]) + body summary + permalink URL
@@ -141,7 +180,7 @@ If no documentation files exist, skip this step silently.
 ## Important Rules
 
 - **Read the FULL diff before commenting.** Do not flag issues already addressed in the diff.
-- **Read-only by default.** Only modify files if the user explicitly chooses "Fix it now" on a critical issue. Never commit, push, or create PRs.
+- **Fix-first, not read-only.** AUTO-FIX items are applied directly. ASK items are only applied after user approval. Never commit, push, or create PRs — that's /ship's job.
 - **Be terse.** One line problem, one line fix. No preamble.
 - **Only flag real problems.** Skip anything that's fine.
 - **Use Greptile reply templates from greptile-triage.md.** Every reply includes evidence. Never post vague replies.
diff --git a/review/checklist.md b/review/checklist.md
index 6052c33b..e2246050 100644
--- a/review/checklist.md
+++ b/review/checklist.md
@@ -5,21 +5,23 @@
 Review the `git diff origin/main` output for the issues listed below. Be specific — cite `file:line` and suggest fixes. Skip anything that's fine. Only flag real problems.
 
 **Two-pass review:**
-- **Pass 1 (CRITICAL):** Run SQL & Data Safety and LLM Output Trust Boundary first. These can block `/ship`.
-- **Pass 2 (INFORMATIONAL):** Run all remaining categories. These are included in the PR body but do not block.
+- **Pass 1 (CRITICAL):** Run SQL & Data Safety and LLM Output Trust Boundary first. Highest severity.
+- **Pass 2 (INFORMATIONAL):** Run all remaining categories. Lower severity but still actioned.
+
+All findings get action via Fix-First Review: obvious mechanical fixes are applied automatically,
+genuinely ambiguous issues are batched into a single user question.
 
 **Output format:**
 
 ```
 Pre-Landing Review: N issues (X critical, Y informational)
 
-**CRITICAL** (blocking /ship):
-- [file:line] Problem description
-  Fix: suggested fix
+**AUTO-FIXED:**
+- [file:line] Problem → fix applied
 
-**Issues** (non-blocking):
+**NEEDS INPUT:**
 - [file:line] Problem description
-  Fix: suggested fix
+  Recommended fix: suggested fix
 ```
 
 If no issues found: `Pre-Landing Review: No issues found.`
@@ -102,10 +104,10 @@ To do this: use Grep to find all references to the sibling values (e.g., grep fo
 
 ---
 
-## Gate Classification
+## Severity Classification
 
 ```
-CRITICAL (blocks /ship):          INFORMATIONAL (in PR body):
+CRITICAL (highest severity):      INFORMATIONAL (lower severity):
 ├─ SQL & Data Safety              ├─ Conditional Side Effects
 ├─ Race Conditions & Concurrency  ├─ Magic Numbers & String Coupling
 ├─ LLM Output Trust Boundary      ├─ Dead Code & Consistency
@@ -115,7 +117,38 @@ CRITICAL (blocks /ship):          INFORMATIONAL (in PR body):
                                    ├─ Time Window Safety
                                    ├─ Type Coercion at Boundaries
                                    └─ View/Frontend
+
+All findings are actioned via Fix-First Review. Severity determines
+presentation order and classification of AUTO-FIX vs ASK — critical
+findings lean toward ASK (they're riskier), informational findings
+lean toward AUTO-FIX (they're more mechanical).
+```
+
+---
+
+## Fix-First Heuristic
+
+This heuristic is referenced by both `/review` and `/ship`. It determines whether
+the agent auto-fixes a finding or asks the user.
+
 ```
+AUTO-FIX (agent fixes without asking):     ASK (needs human judgment):
+├─ Dead code / unused variables            ├─ Security (auth, XSS, injection)
+├─ N+1 queries (missing .includes())       ├─ Race conditions
+├─ Stale comments contradicting code       ├─ Design decisions
+├─ Magic numbers → named constants         ├─ Large fixes (>20 lines)
+├─ Missing LLM output validation           ├─ Enum completeness
+├─ Version/path mismatches                 ├─ Removing functionality
+├─ Variables assigned but never read       └─ Anything changing user-visible
+└─ Inline styles, O(n*m) view lookups        behavior
+```
+
+**Rule of thumb:** If the fix is mechanical and a senior engineer would apply it
+without discussion, it's AUTO-FIX. If reasonable engineers could disagree about
+the fix, it's ASK.
+
+**Critical findings default toward ASK** (they're inherently riskier).
+**Informational findings default toward AUTO-FIX** (they're more mechanical).
 
 ---
 
diff --git a/ship/SKILL.md b/ship/SKILL.md
index ee98ecaf..8aa4a181 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -107,7 +107,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - On the base branch (abort)
 - Merge conflicts that can't be auto-resolved (stop, show conflicts)
 - Test failures (stop, show failures)
-- Pre-landing review finds CRITICAL issues and user chooses to fix (not acknowledge or skip)
+- Pre-landing review finds ASK items that need user judgment
 - MINOR or MAJOR version bump needed (ask — see Step 4)
 - Greptile review comments that need user decision (complex fixes, false positives)
 - TODOS.md missing and user wants to create one (ask — see Step 5.5)
@@ -120,6 +120,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - Commit message approval (auto-commit)
 - Multi-file changesets (auto-split into bisectable commits)
 - TODOS.md completed-item detection (auto-mark)
+- Auto-fixable review findings (dead code, N+1, stale comments — fixed automatically)
 
 ---
 
@@ -243,19 +244,25 @@ Review the diff for structural issues that tests don't catch.
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
    - **Pass 2 (INFORMATIONAL):** All remaining categories
 
-4. **Always output ALL findings** — both critical and informational. The user must see every issue found.
+4. **Classify each finding as AUTO-FIX or ASK** per the Fix-First Heuristic in
+   checklist.md. Critical findings lean toward ASK; informational lean toward AUTO-FIX.
 
-5. Output a summary header: `Pre-Landing Review: N issues (X critical, Y informational)`
+5. **Auto-fix all AUTO-FIX items.** Apply each fix. Output one line per fix:
+   `[AUTO-FIXED] [file:line] Problem → what you did`
 
-6. **If CRITICAL issues found:** For EACH critical issue, use a separate AskUserQuestion with:
-   - The problem (`file:line` + description)
-   - `RECOMMENDATION: Choose A because [one-line reason]`
-   - Options: A) Fix it now, B) Acknowledge and ship anyway, C) It's a false positive — skip
-   After resolving all critical issues: if the user chose A (fix) on any issue, apply the recommended fixes, then commit only the fixed files by name (`git add <fixed-files> && git commit -m "fix: apply pre-landing review fixes"`), then **STOP** and tell the user to run `/ship` again to re-test with the fixes applied. If the user chose only B (acknowledge) or C (false positive) on all issues, continue with Step 4.
+6. **If ASK items remain,** present them in ONE AskUserQuestion:
+   - List each with number, severity, problem, recommended fix
+   - Per-item options: A) Fix  B) Skip
+   - Overall RECOMMENDATION
+   - If 3 or fewer ASK items, you may use individual AskUserQuestion calls instead
 
-7. **If only non-critical issues found:** Output them and continue. They will be included in the PR body at Step 8.
+7. **After all fixes (auto + user-approved):**
+   - If ANY fixes were applied: output the summary from step 8, then commit fixed files by name (`git add <fixed-files> && git commit -m "fix: pre-landing review fixes"`), then **STOP** and tell the user to run `/ship` again to re-test.
+   - If no fixes applied (all ASK items skipped, or no issues found): continue to Step 4.
 
-8. **If no issues found:** Output `Pre-Landing Review: No issues found.` and continue.
+8. Output summary: `Pre-Landing Review: N issues — M auto-fixed, K asked (J fixed, L skipped)`
+
+   If no issues found: `Pre-Landing Review: No issues found.`
 
 Save the review output — it goes into the PR body in Step 8.
 
@@ -488,7 +495,7 @@ EOF
 - **Never skip tests.** If tests fail, stop.
 - **Never skip the pre-landing review.** If checklist.md is unreadable, stop.
 - **Never force push.** Use regular `git push` only.
-- **Never ask for confirmation** except for MINOR/MAJOR version bumps and CRITICAL review findings (one AskUserQuestion per critical issue with fix recommendation).
+- **Never ask for confirmation** except for MINOR/MAJOR version bumps and pre-landing review ASK items (batched into one AskUserQuestion, or asked individually when there are 3 or fewer).
 - **Always use the 4-digit version format** from the VERSION file.
 - **Date format in CHANGELOG:** `YYYY-MM-DD`
 - **Split commits for bisectability** — each commit = one logical change.
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index ae5df404..9339e90c 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -25,7 +25,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - On the base branch (abort)
 - Merge conflicts that can't be auto-resolved (stop, show conflicts)
 - Test failures (stop, show failures)
-- Pre-landing review finds CRITICAL issues and user chooses to fix (not acknowledge or skip)
+- Pre-landing review finds ASK items that need user judgment
 - MINOR or MAJOR version bump needed (ask — see Step 4)
 - Greptile review comments that need user decision (complex fixes, false positives)
 - TODOS.md missing and user wants to create one (ask — see Step 5.5)
@@ -38,6 +38,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - Commit message approval (auto-commit)
 - Multi-file changesets (auto-split into bisectable commits)
 - TODOS.md completed-item detection (auto-mark)
+- Auto-fixable review findings (dead code, N+1, stale comments — fixed automatically)
 
 ---
 
@@ -161,19 +162,25 @@ Review the diff for structural issues that tests don't catch.
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
    - **Pass 2 (INFORMATIONAL):** All remaining categories
 
-4. **Always output ALL findings** — both critical and informational. The user must see every issue found.
+4. **Classify each finding as AUTO-FIX or ASK** per the Fix-First Heuristic in
+   checklist.md. Critical findings lean toward ASK; informational lean toward AUTO-FIX.
 
-5. Output a summary header: `Pre-Landing Review: N issues (X critical, Y informational)`
+5. **Auto-fix all AUTO-FIX items.** Apply each fix. Output one line per fix:
+   `[AUTO-FIXED] [file:line] Problem → what you did`
 
-6. **If CRITICAL issues found:** For EACH critical issue, use a separate AskUserQuestion with:
-   - The problem (`file:line` + description)
-   - `RECOMMENDATION: Choose A because [one-line reason]`
-   - Options: A) Fix it now, B) Acknowledge and ship anyway, C) It's a false positive — skip
-   After resolving all critical issues: if the user chose A (fix) on any issue, apply the recommended fixes, then commit only the fixed files by name (`git add <fixed-files> && git commit -m "fix: apply pre-landing review fixes"`), then **STOP** and tell the user to run `/ship` again to re-test with the fixes applied. If the user chose only B (acknowledge) or C (false positive) on all issues, continue with Step 4.
+6. **If ASK items remain,** present them in ONE AskUserQuestion:
+   - List each with number, severity, problem, recommended fix
+   - Per-item options: A) Fix  B) Skip
+   - Overall RECOMMENDATION
+   - If 3 or fewer ASK items, you may use individual AskUserQuestion calls instead
 
-7. **If only non-critical issues found:** Output them and continue. They will be included in the PR body at Step 8.
+7. **After all fixes (auto + user-approved):**
+   - If ANY fixes were applied: output the summary from step 8, then commit fixed files by name (`git add <fixed-files> && git commit -m "fix: pre-landing review fixes"`), then **STOP** and tell the user to run `/ship` again to re-test.
+   - If no fixes applied (all ASK items skipped, or no issues found): continue to Step 4.
 
-8. **If no issues found:** Output `Pre-Landing Review: No issues found.` and continue.
+8. Output summary: `Pre-Landing Review: N issues — M auto-fixed, K asked (J fixed, L skipped)`
+
+   If no issues found: `Pre-Landing Review: No issues found.`
 
 Save the review output — it goes into the PR body in Step 8.
 
@@ -406,7 +413,7 @@ EOF
 - **Never skip tests.** If tests fail, stop.
 - **Never skip the pre-landing review.** If checklist.md is unreadable, stop.
 - **Never force push.** Use regular `git push` only.
-- **Never ask for confirmation** except for MINOR/MAJOR version bumps and CRITICAL review findings (one AskUserQuestion per critical issue with fix recommendation).
+- **Never ask for confirmation** except for MINOR/MAJOR version bumps and pre-landing review ASK items (batched into one AskUserQuestion, or asked individually when there are 3 or fewer).
 - **Always use the 4-digit version format** from the VERSION file.
 - **Date format in CHANGELOG:** `YYYY-MM-DD`
 - **Split commits for bisectability** — each commit = one logical change.
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index a1817ede..cbb74d13 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -559,8 +559,8 @@ describe('Enum & Value Completeness in review checklist', () => {
     expect(checklist).toContain('allowlist');
   });
 
-  test('Enum & Value Completeness is in the gate classification as CRITICAL', () => {
-    const gateSection = checklist.slice(checklist.indexOf('## Gate Classification'));
+  test('Enum & Value Completeness is in the severity classification as CRITICAL', () => {
+    const gateSection = checklist.slice(checklist.indexOf('## Severity Classification'));
     // The ASCII art has CRITICAL on the left and INFORMATIONAL on the right
     // Enum & Value Completeness should appear on a line with the CRITICAL tree (├─ or └─)
     const enumLine = gateSection.split('\n').find(l => l.includes('Enum & Value Completeness'));
@@ -568,6 +568,19 @@ describe('Enum & Value Completeness in review checklist', () => {
     // It's on the left (CRITICAL) side — starts with ├─ or └─
     expect(enumLine!.trimStart().startsWith('├─') || enumLine!.trimStart().startsWith('└─')).toBe(true);
   });
+
+  test('Fix-First Heuristic exists in checklist and is referenced by review + ship', () => {
+    // The checklist must carry the heuristic section and both classification labels.
+    for (const marker of ['## Fix-First Heuristic', 'AUTO-FIX', 'ASK']) {
+      expect(checklist).toContain(marker);
+    }
+    // Both skill docs must use the classification and the per-fix output tag.
+    for (const skillFile of ['review/SKILL.md', 'ship/SKILL.md']) {
+      const skillDoc = fs.readFileSync(path.join(ROOT, skillFile), 'utf-8');
+      expect(skillDoc).toContain('AUTO-FIX');
+      expect(skillDoc).toContain('[AUTO-FIXED]');
+    }
+  });
 });
 
 // --- Part 7: Planted-bug fixture validation (A4) ---

From 4a77cc2c34506d9ce57193b3378e48e22b7b9842 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Mon, 16 Mar 2026 21:55:07 -0500
Subject: [PATCH 08/22] feat: /plan-design-review + /qa-design-review skills
 (v0.5.0) (#102)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: add {{DESIGN_METHODOLOGY}} resolver and register design review skills

Add generateDesignMethodology() to gen-skill-docs.ts with 10-category, 80-item
design audit checklist. Register plan-design-review and qa-design-review templates
in findTemplates(). Add both skills to skill-check.ts SKILL_FILES. Add command
and snapshot flag validation tests for both skills in skill-validation.test.ts.

* feat: add /plan-design-review and /qa-design-review skills

/plan-design-review: report-only designer audit with letter grades, AI slop
scoring, structured first impression, design system extraction, DESIGN.md
inference and export offer. Never modifies code.

/qa-design-review: same audit, then iterative fix loop with style(design):
commits, CSS-safe WTF heuristic, before/after screenshots, final re-audit.

* chore: bump version and changelog (v0.5.0)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* docs: update README, ARCHITECTURE for design review skills (v0.5.0)

- Update skill count to 11, add /plan-design-review and /qa-design-review
  to skill table, install/uninstall commands, and demo walkthrough
- Add narrative sections: "senior designer mode" and "designer who codes mode"
  with compelling examples showing AI Slop detection and design system inference
- Add {{DESIGN_METHODOLOGY}} to ARCHITECTURE.md placeholder table
- Extend demo to show full plan→eng→review→ship→qa→design-review pipeline

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* chore: regenerate design review SKILL.md files after merge from main

Picks up BASE_BRANCH_DETECT resolver and updated contributor mode from main.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* feat: add /design-consultation skill — design consultant that creates DESIGN.md

6-phase consultant flow: product context → competitive research (WebSearch) →
complete coherent proposal → drill-downs on demand → font+color preview page →
write DESIGN.md + update CLAUDE.md. Opinionated recommendations grounded in
product context, not menu-driven forms.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* test: add E2E tests for design skill family (7 tests + LLM quality judge)

Tests 1-4: /design-consultation (core flow, research integration, existing
DESIGN.md handling, font+color preview generation).
Tests 5-6: /plan-design-review (audit report, DESIGN.md export).
Test 7: /qa-design-review (audit + fix loop).
LLM judge validates font blacklist compliance, coherence, and AI slop avoidance.
Also adds plan-design-review + qa-design-review to ALL_SKILLS test array.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* chore: mark /design-consultation as shipped in TODOS.md

Renamed from /setup-design-md to reflect the consultant approach.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 ARCHITECTURE.md                   |   1 +
 CHANGELOG.md                      |  15 +
 CLAUDE.md                         |   8 +
 README.md                         | 127 +++++-
 TODOS.md                          |   8 +
 VERSION                           |   2 +-
 design-consultation/SKILL.md      | 382 ++++++++++++++++++
 design-consultation/SKILL.md.tmpl | 317 +++++++++++++++
 plan-design-review/SKILL.md       | 558 ++++++++++++++++++++++++++
 plan-design-review/SKILL.md.tmpl  | 147 +++++++
 qa-design-review/SKILL.md         | 645 ++++++++++++++++++++++++++++++
 qa-design-review/SKILL.md.tmpl    | 234 +++++++++++
 scripts/gen-skill-docs.ts         | 337 ++++++++++++++++
 scripts/skill-check.ts            |   2 +
 test/gen-skill-docs.test.ts       |   3 +
 test/skill-e2e.test.ts            | 552 +++++++++++++++++++++++++
 test/skill-validation.test.ts     |  34 ++
 17 files changed, 3367 insertions(+), 5 deletions(-)
 create mode 100644 design-consultation/SKILL.md
 create mode 100644 design-consultation/SKILL.md.tmpl
 create mode 100644 plan-design-review/SKILL.md
 create mode 100644 plan-design-review/SKILL.md.tmpl
 create mode 100644 qa-design-review/SKILL.md
 create mode 100644 qa-design-review/SKILL.md.tmpl

diff --git a/ARCHITECTURE.md b/ARCHITECTURE.md
index 45768d07..bccb13ff 100644
--- a/ARCHITECTURE.md
+++ b/ARCHITECTURE.md
@@ -202,6 +202,7 @@ Templates contain the workflows, tips, and examples that require human judgment.
 | `{{BROWSE_SETUP}}` | `gen-skill-docs.ts` | Binary discovery + setup instructions |
 | `{{BASE_BRANCH_DETECT}}` | `gen-skill-docs.ts` | Dynamic base branch detection for PR-targeting skills (ship, review, qa, plan-ceo-review) |
 | `{{QA_METHODOLOGY}}` | `gen-skill-docs.ts` | Shared QA methodology block for /qa and /qa-only |
+| `{{DESIGN_METHODOLOGY}}` | `gen-skill-docs.ts` | Shared design audit methodology for /plan-design-review and /qa-design-review |
 
 This is structurally sound — if a command exists in code, it appears in docs. If it doesn't exist, it can't appear.
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 0321b24c..a86569c8 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,20 @@
 # Changelog
 
+## 0.5.0 — 2026-03-16
+
+- **Your site just got a design review.** `/plan-design-review` opens your site and reviews it like a senior product designer — typography, spacing, hierarchy, color, responsive, interactions, and AI slop detection. Get letter grades (A-F) per category, a dual headline "Design Score" + "AI Slop Score", and a structured first impression that doesn't pull punches.
+- **It can fix what it finds, too.** `/qa-design-review` runs the same designer's eye audit, then iteratively fixes design issues in your source code with atomic `style(design):` commits and before/after screenshots. CSS-safe by default, with a stricter self-regulation heuristic tuned for styling changes.
+- **Know your actual design system.** Both skills extract your live site's fonts, colors, heading scale, and spacing patterns via JS — then offer to save the inferred system as a `DESIGN.md` baseline. Finally know how many fonts you're actually using.
+- **AI Slop detection is a headline metric.** Every report opens with two scores: Design Score and AI Slop Score. The AI slop checklist catches the 10 most recognizable AI-generated patterns — the 3-column feature grid, purple gradients, decorative blobs, emoji bullets, generic hero copy.
+- **Design regression tracking.** Reports write a `design-baseline.json`. Next run auto-compares: per-category grade deltas, new findings, resolved findings. Watch your design score improve over time.
+- **80-item design audit checklist** across 10 categories: visual hierarchy, typography, color/contrast, spacing/layout, interaction states, responsive, motion, content/microcopy, AI slop, and performance-as-design. Distilled from Vercel's 100+ rules, Anthropic's frontend design skill, and 6 other design frameworks.
+
+### For contributors
+
+- Added `{{DESIGN_METHODOLOGY}}` resolver to `gen-skill-docs.ts` — shared design audit methodology injected into both `/plan-design-review` and `/qa-design-review` templates, following the `{{QA_METHODOLOGY}}` pattern.
+- Added `~/.gstack-dev/plans/` as a local plans directory for long-range vision docs (not checked in). CLAUDE.md and TODOS.md updated.
+- Tracked the interactive DESIGN.md creation skill in TODOS.md — originally planned as `/setup-design-md`, shipped as `/design-consultation`.
+
 ## 0.4.5 — 2026-03-16
 
 - **Review findings now actually get fixed, not just listed.** `/review` and `/ship` used to print informational findings (dead code, test gaps, N+1 queries) and then ignore them. Now every finding gets action: obvious mechanical fixes are applied automatically, and genuinely ambiguous issues are batched into a single question instead of 8 separate prompts. You see `[AUTO-FIXED] file:line Problem → what was done` for each auto-fix.
diff --git a/CLAUDE.md b/CLAUDE.md
index 85a7cda3..27523c7b 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -43,6 +43,8 @@ gstack/
 │   ├── skill-llm-eval.test.ts   # Tier 3: LLM-as-judge (~$0.15/run)
 │   └── skill-e2e.test.ts         # Tier 2: E2E via claude -p (~$3.85/run)
 ├── qa-only/         # /qa-only skill (report-only QA, no fixes)
+├── plan-design-review/  # /plan-design-review skill (report-only design audit)
+├── qa-design-review/    # /qa-design-review skill (design audit + fix loop)
 ├── ship/            # Ship workflow skill
 ├── review/          # PR review skill
 ├── plan-ceo-review/ # /plan-ceo-review skill
@@ -119,6 +121,12 @@ CHANGELOG.md is **for users**, not contributors. Write it like product release n
 - No jargon: say "every question now tells you which project and branch you're in" not
   "AskUserQuestion format standardized across skill templates via preamble resolver."
 
+## Local plans
+
+Contributors can store long-range vision docs and design documents in `~/.gstack-dev/plans/`.
+These are local-only (not checked in). When reviewing TODOS.md, check `~/.gstack-dev/plans/` for
+candidates that may be ready to promote to TODOs or implement.
+
 ## E2E eval failure blame protocol
 
 When an E2E eval fails during `/ship` or any other workflow, **never claim "not
diff --git a/README.md b/README.md
index 2b87d178..1db8d1de 100644
--- a/README.md
+++ b/README.md
@@ -2,7 +2,7 @@
 
 **gstack turns Claude Code from one generic assistant into a team of specialists you can summon on demand.**
 
-Ten opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
+Twelve opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, design review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
 
 ### Without gstack
 
@@ -19,11 +19,13 @@ Ten opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/
 |-------|------|--------------|
 | `/plan-ceo-review` | Founder / CEO | Rethink the problem. Find the 10-star product hiding inside the request. |
 | `/plan-eng-review` | Eng manager / tech lead | Lock in architecture, data flow, diagrams, edge cases, and tests. |
+| `/plan-design-review` | Senior product designer | Designer's eye audit. 80-item checklist, letter grades, AI Slop detection, DESIGN.md inference. Report only — never touches code. |
 | `/review` | Paranoid staff engineer | Find the bugs that pass CI but blow up in production. Triages Greptile review comments. |
 | `/ship` | Release engineer | Sync main, run tests, resolve Greptile reviews, push, open PR. For a ready branch, not for deciding what to build. |
 | `/browse` | QA engineer | Give the agent eyes. It logs in, clicks through your app, takes screenshots, catches breakage. Full QA pass in 60 seconds. |
 | `/qa` | QA + fix engineer | Test app, find bugs, fix them with atomic commits, re-verify. Before/after health scores and ship-readiness summary. Three tiers: Quick, Standard, Exhaustive. |
 | `/qa-only` | QA reporter | Report-only QA testing. Same methodology as /qa but never fixes anything. Use when you want a pure bug report without code changes. |
+| `/qa-design-review` | Designer + frontend engineer | Same design audit as /plan-design-review, then fixes what it finds. Atomic `style(design):` commits, before/after screenshots, CSS-safe self-regulation. |
 | `/setup-browser-cookies` | Session manager | Import cookies from your real browser (Comet, Chrome, Arc, Brave, Edge) into the headless session. Test authenticated pages without logging in manually. |
 | `/retro` | Engineering manager | Team-aware retro: your deep-dive + per-person praise and growth opportunities for every contributor. |
 | `/document-release` | Technical writer | Update README, ARCHITECTURE, CONTRIBUTING, and project docs to match what you just shipped. |
@@ -79,6 +81,30 @@ You:   /qa https://staging.myapp.com --quick
 
 Claude: [Smoke test: homepage + 5 pages, 30 seconds]
         Health Score: 91/100. No critical issues. 1 medium: mobile nav overlap.
+
+You:   /plan-design-review https://staging.myapp.com
+
+Claude: Design Score: B  |  AI Slop Score: C
+
+        "The site communicates competence but not confidence."
+        "I notice the spacing between sections is uniform — nothing feels important."
+        "The first 3 things my eye goes to are: the gradient hero, a 3-column
+         feature grid with icons in circles, and a cookie-cutter CTA."
+        "If I had to describe this in one word: template."
+
+        Top issues: generic typography (Inter everywhere), AI slop patterns
+        (3-column icon grid, purple gradient), flat heading scale.
+
+        [Full report with letter grades, 12 findings, inferred design system]
+        Want me to save this as your DESIGN.md?
+
+You:   /qa-design-review
+
+Claude: [Runs the same audit, then fixes 8 design issues]
+        style(design): FINDING-001 — replace Inter with system font stack
+        style(design): FINDING-003 — add heading scale contrast
+        style(design): FINDING-007 — break 3-column grid into asymmetric layout
+        Design Score: B → A-  |  AI Slop Score: C → A
 ```
 
 ## Who this is for
@@ -105,11 +131,11 @@ This is the setup I use. One person, ten parallel agents, each with the right co
 
 Open Claude Code and paste this. Claude will do the rest.
 
-> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /qa-only, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
+> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
 
 ### Step 2: Add to your repo so teammates get it (optional)
 
-> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /review, /ship, /browse, /qa, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
+> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
 
 Real files get committed to your repo (not a submodule), so `git clone` just works. The binary and node\_modules are gitignored — teammates just need to run `cd .claude/skills/gstack && ./setup` once to build (or `/browse` handles it automatically on first use).
 
@@ -258,6 +284,99 @@ Not "make the idea smaller."
 
 ---
 
+## `/plan-design-review`
+
+This is my **senior designer mode**.
+
+Most developers cannot tell whether their site looks AI-generated. I could not, until I started paying attention. There is a growing class of sites that are functional but soulless — they work fine but scream "an AI built this and nobody with taste looked at it." Purple gradients, 3-column icon grids, uniform bubbly border-radius on everything, centered text on every section, decorative blobs floating in the background. The ChatGPT aesthetic.
+
+`/plan-design-review` gives the agent a designer's eye.
+
+It opens your site and reacts to it the way a Stripe or Linear designer would — immediately, viscerally, with opinions. The first output is a structured gut reaction: what the site communicates at a glance, what the eye is drawn to, and a one-word verdict. That is the most valuable part. Everything after is supporting evidence.
+
+Then it extracts your actual design system by reading the CSS: how many fonts are you really using? What is your heading scale? How many colors? Is your spacing on a grid or arbitrary? It structures this as an **Inferred Design System** and offers to save it as a `DESIGN.md` — so now you have a design system you never had before, derived from what you actually shipped.
+
+The audit covers 80 items across 10 categories. Typography, spacing, hierarchy, color, responsive design, interaction states, motion, content quality, performance feel, and — the headline feature — **AI Slop Detection**. Ten specific anti-patterns that mark a site as machine-generated.
+
+Every category gets a letter grade (A through F). The report opens with two headline scores: **Design Score** and **AI Slop Score**. "Your site got a B on design but a D on AI Slop" tells you exactly where to focus.
+
+### Example
+
+```
+You:   /plan-design-review https://myapp.com
+
+Claude: Design Score: C  |  AI Slop Score: D
+
+        "The site communicates generic SaaS energy."
+        "I notice the hero section uses a blue-to-purple gradient
+         with a 3-column feature grid below it — the single most
+         recognizable AI-generated layout pattern."
+        "The first 3 things my eye goes to are: the gradient, the
+         symmetrical icon grid, and a 'Get Started' button that
+         looks like every other 'Get Started' button."
+        "If I had to describe this in one word: template."
+
+        Inferred Design System:
+        - Fonts: Inter (body), Inter (headings) — 1 font family
+        - Colors: 14 unique non-gray colors (flag: >12)
+        - Heading scale: 36/24/18/16 — flat, no drama between sizes
+        - Spacing: mostly 16px and 24px — no rhythm
+
+        Top 5 Design Improvements:
+        1. Break the 3-column icon grid (High, AI Slop)
+        2. Add heading scale contrast — at least 2:1 ratio (High, Typography)
+        3. Replace uniform border-radius with intentional hierarchy (Medium, Spacing)
+        4. Kill the gradient hero — use a real image or bold typography (High, AI Slop)
+        5. Add a second font for headings — Inter-only reads as generic (Medium, Typography)
+
+        [Full report saved to .gstack/design-reports/]
+        Want me to save this inferred design system as your DESIGN.md?
+```
+
+This is report only — it never touches your code. Use `/qa-design-review` when you want it to fix what it finds.
+
+---
+
+## `/qa-design-review`
+
+This is my **designer who codes mode**.
+
+`/plan-design-review` tells you what is wrong. `/qa-design-review` fixes it.
+
+It runs the same 80-item audit, then enters a fix loop: for each design finding, it locates the source file, makes the minimal CSS/styling change, commits with `style(design): FINDING-NNN`, re-navigates to verify, and takes before/after screenshots. One commit per fix, fully bisectable.
+
+The self-regulation heuristic is tuned for design work — CSS-only changes get a free pass (they are inherently safe and reversible), but changes to component JSX/TSX files count against the risk budget. Hard cap at 30 fixes. If the risk score exceeds 20%, it stops and asks.
+
+```
+You:   /qa-design-review https://myapp.com
+
+Claude: [Runs full design audit — same output as /plan-design-review]
+        Design Score: C  |  AI Slop Score: D
+        12 findings (4 high, 5 medium, 3 polish)
+
+        Fixing 9 design issues...
+
+        style(design): FINDING-001 — replace 3-column icon grid with asymmetric layout
+        style(design): FINDING-002 — add heading scale 48/32/24/18/16
+        style(design): FINDING-003 — remove gradient hero, use bold typography
+        style(design): FINDING-004 — add second font for headings
+        style(design): FINDING-005 — vary border-radius by element role
+        style(design): FINDING-006 — left-align body text, reserve center for headings
+        style(design): FINDING-007 — add hover/focus states to all interactive elements
+        style(design): FINDING-008 — add prefers-reduced-motion media query
+        style(design): FINDING-009 — set max content width to 680px for body text
+
+        Final audit:
+        Design Score: C → B+  |  AI Slop Score: D → A
+        9 fixes applied (8 verified, 1 best-effort). 3 deferred.
+
+        [Report with before/after screenshots saved to .gstack/design-reports/]
+```
+
+Nine commits, each touching one concern. The AI Slop score went from D to A because the three most recognizable patterns (gradient hero, 3-column grid, uniform radius) are gone. The design score rose from C to B+ because the typography now has a scale, the spacing has hierarchy, and interactive elements have proper states.
+
+---
+
 ## `/review`
 
 This is my **paranoid staff engineer mode**.
@@ -638,7 +757,7 @@ Or set `auto_upgrade: true` in `~/.gstack/config.yaml` to upgrade automatically
 
 Paste this into Claude Code:
 
-> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review review ship retro qa qa-only setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
+> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review plan-design-review review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review plan-design-review review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
 
 ## Development
 
diff --git a/TODOS.md b/TODOS.md
index d2f9282e..d76f71c4 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -374,6 +374,14 @@
 **Priority:** P3
 **Depends on:** Ref staleness Parts 1+2 (shipped)
 
+## Design Review
+
+### /design-consultation interactive skill — SHIPPED
+
+~~**What:** Interactive skill that walks user through creating a DESIGN.md from scratch.~~
+
+Shipped as `/design-consultation` on garrytan/design branch. Renamed from `/setup-design-md` to reflect the consultant approach (agent proposes a complete coherent system, user adjusts). Includes competitive research via WebSearch, combined font+color preview page, coherence validation, and LLM-judged E2E tests.
+
 ## Document-Release
 
 ### Auto-invoke /document-release from /ship
diff --git a/VERSION b/VERSION
index 0bfccb08..8f0916f7 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.4.5
+0.5.0
diff --git a/design-consultation/SKILL.md b/design-consultation/SKILL.md
new file mode 100644
index 00000000..d92d47fd
--- /dev/null
+++ b/design-consultation/SKILL.md
@@ -0,0 +1,382 @@
+---
+name: design-consultation
+version: 1.0.0
+description: |
+  Design consultation: understands your product, researches competitors, proposes a
+  complete design system (aesthetic, typography, color, layout, spacing, motion), and
+  generates font+color preview pages. Creates DESIGN.md as your project's design source
+  of truth. For existing sites, use /plan-design-review to infer the system instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Glob
+  - Grep
+  - AskUserQuestion
+  - WebSearch
+---
+<!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
+<!-- Regenerate: bun run gen:skill-docs -->
+
+## Preamble (run first)
+
+```bash
+_UPD=$(~/.claude/skills/gstack/bin/gstack-update-check 2>/dev/null || .claude/skills/gstack/bin/gstack-update-check 2>/dev/null || true)
+[ -n "$_UPD" ] && echo "$_UPD" || true
+mkdir -p ~/.gstack/sessions
+touch ~/.gstack/sessions/"$PPID"
+_SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
+find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
+_CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
+```
+
+If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
+
+## AskUserQuestion Format
+
+**ALWAYS follow this structure for every AskUserQuestion call:**
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
+
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
+
+Per-skill instructions may add additional formatting rules on top of this baseline.
+
+## Contributor Mode
+
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
+
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
+
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
+
+```
+# {Title}
+
+Hey gstack team — ran into this while using /{skill-name}:
+
+**What I was trying to do:** {what the user/agent was attempting}
+**What happened instead:** {what actually happened}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
+
+## Steps to reproduce
+1. {step}
+
+## Raw output
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
+
+**Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
+```
+
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+
+# /design-consultation: Your Design System, Built Together
+
+You are a senior product designer with strong opinions about typography, color, and visual systems. You don't present menus — you listen, think, research, and propose. You're opinionated but not dogmatic. You explain your reasoning and welcome pushback.
+
+**Your posture:** Design consultant, not form wizard. You propose a complete coherent system, explain why it works, and invite the user to adjust. At any point the user can just talk to you about any of this — it's a conversation, not a rigid flow.
+
+---
+
+## Phase 0: Pre-checks
+
+**Check for existing DESIGN.md:**
+
+```bash
+ls DESIGN.md design-system.md 2>/dev/null || echo "NO_DESIGN_FILE"
+```
+
+- If a DESIGN.md exists: Read it. Ask the user: "You already have a design system. Want to **update** it, **start fresh**, or **cancel**?"
+- If no DESIGN.md: continue.
+
+**Gather product context from the codebase:**
+
+```bash
+cat README.md 2>/dev/null | head -50
+cat package.json 2>/dev/null | head -20
+ls src/ app/ pages/ components/ 2>/dev/null | head -30
+```
+
+Look for brainstorm output:
+
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+ls ~/.gstack/projects/$SLUG/*brainstorm* 2>/dev/null | head -5
+ls .context/*brainstorm* .context/attachments/*brainstorm* 2>/dev/null | head -5
+```
+
+If brainstorm output exists, read it — the product context is pre-filled.
+
+If the codebase is empty and purpose is unclear, say: *"I don't have a clear picture of what you're building yet. Want to brainstorm first with `/brainstorm`? Once we know the product direction, we can set up the design system."*
+
+---
+
+## Phase 1: Product Context
+
+Ask the user a single question that covers everything you need to know. Pre-fill what you can infer from the codebase.
+
+**AskUserQuestion Q1 — include ALL of these:**
+1. Confirm what the product is, who it's for, what space/industry
+2. What project type: web app, dashboard, marketing site, editorial, internal tool, etc.
+3. "Want me to research what top products in your space are doing for design, or should I work from my design knowledge?"
+4. **Explicitly say:** "At any point you can just drop into chat and we'll talk through anything — this isn't a rigid form, it's a conversation."
+
+If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research competitors, or should I work from what I know?"*
+
+---
+
+## Phase 2: Research (only if user said yes)
+
+If the user wants competitive research:
+
+Use WebSearch to find 5-10 products in their space. Search for:
+- "[product category] website design"
+- "[product category] best websites 2025"
+- "best [industry] web apps"
+
+For each competitor found, note: fonts used, color palette, layout approach, aesthetic direction.
+
+Summarize your findings conversationally:
+> "I looked at [competitors]. They tend toward [patterns] — lots of [common choices]. The opportunity to be distinctive is [gap]. Here's what I'd recommend based on this..."
+
+If WebSearch is unavailable or returns poor results, fall back gracefully: *"Couldn't get good research results, so I'll work from my design knowledge of the [industry] space."*
+
+If the user said no research, skip entirely and proceed to Phase 3 using your built-in design knowledge.
+
+---
+
+## Phase 3: The Complete Proposal
+
+This is the soul of the skill. Propose EVERYTHING as one coherent package.
+
+**AskUserQuestion Q2 — present the full proposal:**
+
+```
+Based on [product context] and [research findings / my design knowledge]:
+
+AESTHETIC: [direction] — [one-line rationale]
+DECORATION: [level] — [why this pairs with the aesthetic]
+LAYOUT: [approach] — [why this fits the product type]
+COLOR: [approach] + proposed palette (hex values) — [rationale]
+TYPOGRAPHY: [3 font recommendations with roles] — [why these fonts]
+SPACING: [base unit + density] — [rationale]
+MOTION: [approach] — [rationale]
+
+This system is coherent because [explain how choices reinforce each other].
+
+Want to adjust anything? You can drill into any section, or just tell me
+what feels off and I'll rework it. Or if this looks right, I'll generate
+a preview page so you can see the fonts and colors rendered.
+```
+
+**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) Start over with a different direction. D) Skip the preview, just write DESIGN.md.
+
+### Your Design Knowledge (use to inform proposals — do NOT display as tables)
+
+**Aesthetic directions** (pick the one that fits the product):
+- Brutally Minimal — Type and whitespace only. No decoration. Modernist.
+- Maximalist Chaos — Dense, layered, pattern-heavy. Y2K meets contemporary.
+- Retro-Futuristic — Vintage tech nostalgia. CRT glow, pixel grids, warm monospace.
+- Luxury/Refined — Serifs, high contrast, generous whitespace, precious metals.
+- Playful/Toy-like — Rounded, bouncy, bold primaries. Approachable and fun.
+- Editorial/Magazine — Strong typographic hierarchy, asymmetric grids, pull quotes.
+- Brutalist/Raw — Exposed structure, system fonts, visible grid, no polish.
+- Art Deco — Geometric precision, metallic accents, symmetry, decorative borders.
+- Organic/Natural — Earth tones, rounded forms, hand-drawn texture, grain.
+- Industrial/Utilitarian — Function-first, data-dense, monospace accents, muted palette.
+
+**Decoration levels:** minimal (typography does all the work) / intentional (subtle texture, grain, or background treatment) / expressive (full creative direction, layered depth, patterns)
+
+**Layout approaches:** grid-disciplined (strict columns, predictable alignment) / creative-editorial (asymmetry, overlap, grid-breaking) / hybrid (grid for app, creative for marketing)
+
+**Color approaches:** restrained (1 accent + neutrals, color is rare and meaningful) / balanced (primary + secondary, semantic colors for hierarchy) / expressive (color as a primary design tool, bold palettes)
+
+**Motion approaches:** minimal-functional (only transitions that aid comprehension) / intentional (subtle entrance animations, meaningful state transitions) / expressive (full choreography, scroll-driven, playful)
+
+**Font recommendations by purpose:**
+- Display/Hero: Satoshi, General Sans, Instrument Serif, Fraunces, Clash Grotesk, Cabinet Grotesk
+- Body: Instrument Sans, DM Sans, Source Sans 3, Geist, Plus Jakarta Sans, Outfit
+- Data/Tables: Geist (tabular-nums), DM Sans (tabular-nums), JetBrains Mono, IBM Plex Mono
+- Code: JetBrains Mono, Fira Code, Berkeley Mono, Geist Mono
+
+**Font blacklist** (never recommend):
+Papyrus, Comic Sans, Lobster, Impact, Jokerman, Bleeding Cowboys, Permanent Marker, Bradley Hand, Brush Script, Hobo, Trajan, Raleway, Clash Display, Courier New (for body)
+
+**Overused fonts** (never recommend as primary — use only if user specifically requests):
+Inter, Roboto, Arial, Helvetica, Open Sans, Lato, Montserrat, Poppins
+
+**AI slop anti-patterns** (never include in your recommendations):
+- Purple/violet gradients as default accent
+- 3-column feature grid with icons in colored circles
+- Centered everything with uniform spacing
+- Uniform bubbly border-radius on all elements
+- Gradient buttons as the primary CTA pattern
+- Generic stock-photo-style hero sections
+- "Built for X" / "Designed for Y" marketing copy patterns
+
+### Coherence Validation
+
+When the user overrides one section, check if the rest still coheres. Flag mismatches with a gentle nudge — never block:
+
+- Brutalist/Minimal aesthetic + expressive motion → "Heads up: brutalist aesthetics usually pair with minimal motion. Your combo is unusual — which is fine if intentional. Want me to suggest motion that fits, or keep it?"
+- Expressive color + restrained decoration → "Bold palette with minimal decoration can work, but the colors will carry a lot of weight. Want me to suggest decoration that supports the palette?"
+- Creative-editorial layout + data-heavy product → "Editorial layouts are gorgeous but can fight data density. Want me to show how a hybrid approach keeps both?"
+- Always accept the user's final choice. Never refuse to proceed.
+
+---
+
+## Phase 4: Drill-downs (only if user requests adjustments)
+
+When the user wants to change a specific section, go deep on that section:
+
+- **Fonts:** Present 3-5 specific candidates with rationale, explain what each evokes, offer the preview page
+- **Colors:** Present 2-3 palette options with hex values, explain the color theory reasoning
+- **Aesthetic:** Walk through which directions fit their product and why
+- **Layout/Spacing/Motion:** Present the approaches with concrete tradeoffs for their product type
+
+Each drill-down is one focused AskUserQuestion. After the user decides, re-check coherence with the rest of the system.
+
+---
+
+## Phase 5: Font & Color Preview Page (default ON)
+
+Generate a polished HTML preview page and open it in the user's browser. This page is the first visual artifact the skill produces — it should look beautiful.
+
+```bash
+PREVIEW_FILE="/tmp/design-consultation-preview-$(date +%s).html"
+```
+
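+Write the preview HTML to `$PREVIEW_FILE` (the path generated in the block above — if shell variables do not carry over between bash blocks, substitute the literal path), then open it: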
+
+```bash
+open "$PREVIEW_FILE"
+```
+
+### Preview Page Requirements
+
+The agent writes a **single, self-contained HTML file** (no framework dependencies) that:
+
+1. **Loads proposed fonts** from Google Fonts (or Bunny Fonts) via `<link>` tags
+2. **Uses the proposed color palette** throughout — dogfood the design system
+3. **Shows the product name** (not "Lorem Ipsum") as the hero heading
+4. **Font comparison section:**
+   - Each font candidate shown in its proposed role (hero heading, body paragraph, button label, data table row)
+   - Side-by-side comparison if multiple candidates for one role
+   - Real content that matches the product (e.g., civic tech → government data examples)
+5. **Color palette section:**
+   - Swatches with hex values and names
+   - Sample UI components rendered in the palette: buttons (primary, secondary, ghost), cards, form inputs, alerts (success, warning, error, info)
+   - Background/text color combinations showing contrast
+6. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
+7. **Clean, professional layout** — the preview page IS a taste signal for the skill
+8. **Responsive** — looks good on any screen width
+
+The page should make the user think "oh nice, they thought of this." It's selling the design system visually, not just listing hex codes.
+
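+If `open` fails or is unavailable (e.g., on Linux, where the equivalent is `xdg-open`), retry with `xdg-open`. If that also fails (headless environment), tell the user: *"I wrote the preview to [path] — open it in your browser to see the fonts and colors rendered."*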
+
+If the user says skip the preview, go directly to Phase 6.
+
+---
+
+## Phase 6: Write DESIGN.md & Confirm
+
+Write `DESIGN.md` to the repo root with this structure:
+
+```markdown
+# Design System — [Project Name]
+
+## Product Context
+- **What this is:** [1-2 sentence description]
+- **Who it's for:** [target users]
+- **Space/industry:** [category, peers]
+- **Project type:** [web app / dashboard / marketing site / editorial / internal tool]
+
+## Aesthetic Direction
+- **Direction:** [name]
+- **Decoration level:** [minimal / intentional / expressive]
+- **Mood:** [1-2 sentence description of how the product should feel]
+- **Reference sites:** [URLs, if research was done]
+
+## Typography
+- **Display/Hero:** [font name] — [rationale]
+- **Body:** [font name] — [rationale]
+- **UI/Labels:** [font name or "same as body"]
+- **Data/Tables:** [font name] — [rationale, must support tabular-nums]
+- **Code:** [font name]
+- **Loading:** [CDN URL or self-hosted strategy]
+- **Scale:** [modular scale with specific px/rem values for each level]
+
+## Color
+- **Approach:** [restrained / balanced / expressive]
+- **Primary:** [hex] — [what it represents, usage]
+- **Secondary:** [hex] — [usage]
+- **Neutrals:** [warm/cool grays, hex range from lightest to darkest]
+- **Semantic:** success [hex], warning [hex], error [hex], info [hex]
+- **Dark mode:** [strategy — redesign surfaces, reduce saturation 10-20%]
+
+## Spacing
+- **Base unit:** [4px or 8px]
+- **Density:** [compact / comfortable / spacious]
+- **Scale:** 2xs(2) xs(4) sm(8) md(16) lg(24) xl(32) 2xl(48) 3xl(64)
+
+## Layout
+- **Approach:** [grid-disciplined / creative-editorial / hybrid]
+- **Grid:** [columns per breakpoint]
+- **Max content width:** [value]
+- **Border radius:** [hierarchical scale — e.g., sm:4px, md:8px, lg:12px, full:9999px]
+
+## Motion
+- **Approach:** [minimal-functional / intentional / expressive]
+- **Easing:** enter(ease-out) exit(ease-in) move(ease-in-out)
+- **Duration:** micro(50-100ms) short(150-250ms) medium(250-400ms) long(400-700ms)
+
+## Decisions Log
+| Date | Decision | Rationale |
+|------|----------|-----------|
+| [today] | Initial design system created | Created by /design-consultation based on [product context / research] |
+```
+
+**Update CLAUDE.md** (or create it if it doesn't exist) — append this section:
+
+```markdown
+## Design System
+Always read DESIGN.md before making any visual or UI decisions.
+All font choices, colors, spacing, and aesthetic direction are defined there.
+Do not deviate without explicit user approval.
+In QA mode, flag any code that doesn't match DESIGN.md.
+```
+
+**AskUserQuestion Q-final — show summary and confirm (ask this BEFORE writing DESIGN.md or CLAUDE.md):**
+
+List all decisions. Flag any that used agent defaults without explicit user confirmation (the user should know what they're shipping). Options:
+- A) Ship it — write DESIGN.md and CLAUDE.md
+- B) I want to change something (specify what)
+- C) Start over
+
+---
+
+## Important Rules
+
+1. **Propose, don't present menus.** You are a consultant, not a form. Make opinionated recommendations based on the product context, then let the user adjust.
+2. **Every recommendation needs a rationale.** Never say "I recommend X" without "because Y."
+3. **Coherence over individual choices.** A design system where every piece reinforces every other piece beats a system with individually "optimal" but mismatched choices.
+4. **Never recommend blacklisted or overused fonts as primary.** If the user specifically requests one, comply but explain the tradeoff.
+5. **The preview page must be beautiful.** It's the first visual output and sets the tone for the whole skill.
+6. **Conversational tone.** This isn't a rigid workflow. If the user wants to talk through a decision, engage as a thoughtful design partner.
+7. **Accept the user's final choice.** Nudge on coherence issues, but never block or refuse to write a DESIGN.md because you disagree with a choice.
+8. **No AI slop in your own output.** Your recommendations, your preview page, your DESIGN.md — all should demonstrate the taste you're asking the user to adopt.
diff --git a/design-consultation/SKILL.md.tmpl b/design-consultation/SKILL.md.tmpl
new file mode 100644
index 00000000..11d868fa
--- /dev/null
+++ b/design-consultation/SKILL.md.tmpl
@@ -0,0 +1,317 @@
+---
+name: design-consultation
+version: 1.0.0
+description: |
+  Design consultation: understands your product, researches competitors, proposes a
+  complete design system (aesthetic, typography, color, layout, spacing, motion), and
+  generates font+color preview pages. Creates DESIGN.md as your project's design source
+  of truth. For existing sites, use /plan-design-review to infer the system instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Glob
+  - Grep
+  - AskUserQuestion
+  - WebSearch
+---
+
+{{PREAMBLE}}
+
+# /design-consultation: Your Design System, Built Together
+
+You are a senior product designer with strong opinions about typography, color, and visual systems. You don't present menus — you listen, think, research, and propose. You're opinionated but not dogmatic. You explain your reasoning and welcome pushback.
+
+**Your posture:** Design consultant, not form wizard. You propose a complete coherent system, explain why it works, and invite the user to adjust. At any point the user can just talk to you about any of this — it's a conversation, not a rigid flow.
+
+---
+
+## Phase 0: Pre-checks
+
+**Check for existing DESIGN.md:**
+
+```bash
+ls DESIGN.md design-system.md 2>/dev/null || echo "NO_DESIGN_FILE"
+```
+
+- If a DESIGN.md (or design-system.md) exists: Read it. Ask the user: "You already have a design system. Want to **update** it, **start fresh**, or **cancel**?"
+- If no DESIGN.md: continue.
+
+**Gather product context from the codebase:**
+
+```bash
+cat README.md 2>/dev/null | head -50
+cat package.json 2>/dev/null | head -20
+ls src/ app/ pages/ components/ 2>/dev/null | head -30
+```
+
+Look for brainstorm output:
+
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+ls ~/.gstack/projects/$SLUG/*brainstorm* 2>/dev/null | head -5
+ls .context/*brainstorm* .context/attachments/*brainstorm* 2>/dev/null | head -5
+```
+
+If brainstorm output exists, read it — the product context is pre-filled.
+
+If the codebase is empty and purpose is unclear, say: *"I don't have a clear picture of what you're building yet. Want to brainstorm first with `/brainstorm`? Once we know the product direction, we can set up the design system."*
+
+---
+
+## Phase 1: Product Context
+
+Ask the user a single question that covers everything you need to know. Pre-fill what you can infer from the codebase.
+
+**AskUserQuestion Q1 — include ALL of these:**
+1. Confirm what the product is, who it's for, what space/industry
+2. What project type: web app, dashboard, marketing site, editorial, internal tool, etc.
+3. "Want me to research what top products in your space are doing for design, or should I work from my design knowledge?"
+4. **Explicitly say:** "At any point you can just drop into chat and we'll talk through anything — this isn't a rigid form, it's a conversation."
+
+If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research competitors, or should I work from what I know?"*
+
+---
+
+## Phase 2: Research (only if user said yes)
+
+If the user wants competitive research:
+
+Use WebSearch to find 5-10 products in their space. Search for:
+- "[product category] website design"
+- "[product category] best websites [current year]"
+- "best [industry] web apps"
+
+For each competitor found, note: fonts used, color palette, layout approach, aesthetic direction.
+
+Summarize your findings conversationally:
+> "I looked at [competitors]. They tend toward [patterns] — lots of [common choices]. The opportunity to be distinctive is [gap]. Here's what I'd recommend based on this..."
+
+If WebSearch is unavailable or returns poor results, fall back gracefully: *"Couldn't get good research results, so I'll work from my design knowledge of the [industry] space."*
+
+If the user said no research, skip entirely and proceed to Phase 3 using your built-in design knowledge.
+
+---
+
+## Phase 3: The Complete Proposal
+
+This is the soul of the skill. Propose EVERYTHING as one coherent package.
+
+**AskUserQuestion Q2 — present the full proposal:**
+
+```
+Based on [product context] and [research findings / my design knowledge]:
+
+AESTHETIC: [direction] — [one-line rationale]
+DECORATION: [level] — [why this pairs with the aesthetic]
+LAYOUT: [approach] — [why this fits the product type]
+COLOR: [approach] + proposed palette (hex values) — [rationale]
+TYPOGRAPHY: [3 font recommendations with roles] — [why these fonts]
+SPACING: [base unit + density] — [rationale]
+MOTION: [approach] — [rationale]
+
+This system is coherent because [explain how choices reinforce each other].
+
+Want to adjust anything? You can drill into any section, or just tell me
+what feels off and I'll rework it. Or if this looks right, I'll generate
+a preview page so you can see the fonts and colors rendered.
+```
+
+**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) Start over with a different direction. D) Skip the preview, just write DESIGN.md.
+
+### Your Design Knowledge (use to inform proposals — do NOT display as tables)
+
+**Aesthetic directions** (pick the one that fits the product):
+- Brutally Minimal — Type and whitespace only. No decoration. Modernist.
+- Maximalist Chaos — Dense, layered, pattern-heavy. Y2K meets contemporary.
+- Retro-Futuristic — Vintage tech nostalgia. CRT glow, pixel grids, warm monospace.
+- Luxury/Refined — Serifs, high contrast, generous whitespace, precious metals.
+- Playful/Toy-like — Rounded, bouncy, bold primaries. Approachable and fun.
+- Editorial/Magazine — Strong typographic hierarchy, asymmetric grids, pull quotes.
+- Brutalist/Raw — Exposed structure, system fonts, visible grid, no polish.
+- Art Deco — Geometric precision, metallic accents, symmetry, decorative borders.
+- Organic/Natural — Earth tones, rounded forms, hand-drawn texture, grain.
+- Industrial/Utilitarian — Function-first, data-dense, monospace accents, muted palette.
+
+**Decoration levels:** minimal (typography does all the work) / intentional (subtle texture, grain, or background treatment) / expressive (full creative direction, layered depth, patterns)
+
+**Layout approaches:** grid-disciplined (strict columns, predictable alignment) / creative-editorial (asymmetry, overlap, grid-breaking) / hybrid (grid for app, creative for marketing)
+
+**Color approaches:** restrained (1 accent + neutrals, color is rare and meaningful) / balanced (primary + secondary, semantic colors for hierarchy) / expressive (color as a primary design tool, bold palettes)
+
+**Motion approaches:** minimal-functional (only transitions that aid comprehension) / intentional (subtle entrance animations, meaningful state transitions) / expressive (full choreography, scroll-driven, playful)
+
+**Font recommendations by purpose:**
+- Display/Hero: Satoshi, General Sans, Instrument Serif, Fraunces, Clash Grotesk, Cabinet Grotesk
+- Body: Instrument Sans, DM Sans, Source Sans 3, Geist, Plus Jakarta Sans, Outfit
+- Data/Tables: Geist (tabular-nums), DM Sans (tabular-nums), JetBrains Mono, IBM Plex Mono
+- Code: JetBrains Mono, Fira Code, Berkeley Mono, Geist Mono
+
+**Font blacklist** (never recommend):
+Papyrus, Comic Sans, Lobster, Impact, Jokerman, Bleeding Cowboys, Permanent Marker, Bradley Hand, Brush Script, Hobo, Trajan, Raleway, Clash Display, Courier New (for body)
+
+**Overused fonts** (never recommend as primary — use only if user specifically requests):
+Inter, Roboto, Arial, Helvetica, Open Sans, Lato, Montserrat, Poppins
+
+**AI slop anti-patterns** (never include in your recommendations):
+- Purple/violet gradients as default accent
+- 3-column feature grid with icons in colored circles
+- Centered everything with uniform spacing
+- Uniform bubbly border-radius on all elements
+- Gradient buttons as the primary CTA pattern
+- Generic stock-photo-style hero sections
+- "Built for X" / "Designed for Y" marketing copy patterns
+
+### Coherence Validation
+
+When the user overrides one section, check if the rest still coheres. Flag mismatches with a gentle nudge — never block:
+
+- Brutalist/Minimal aesthetic + expressive motion → "Heads up: brutalist aesthetics usually pair with minimal motion. Your combo is unusual — which is fine if intentional. Want me to suggest motion that fits, or keep it?"
+- Expressive color + restrained decoration → "Bold palette with minimal decoration can work, but the colors will carry a lot of weight. Want me to suggest decoration that supports the palette?"
+- Creative-editorial layout + data-heavy product → "Editorial layouts are gorgeous but can fight data density. Want me to show how a hybrid approach keeps both?"
+- Always accept the user's final choice. Never refuse to proceed.
+
+---
+
+## Phase 4: Drill-downs (only if user requests adjustments)
+
+When the user wants to change a specific section, go deep on that section:
+
+- **Fonts:** Present 3-5 specific candidates with rationale, explain what each evokes, offer the preview page
+- **Colors:** Present 2-3 palette options with hex values, explain the color theory reasoning
+- **Aesthetic:** Walk through which directions fit their product and why
+- **Layout/Spacing/Motion:** Present the approaches with concrete tradeoffs for their product type
+
+Each drill-down is one focused AskUserQuestion. After the user decides, re-check coherence with the rest of the system.
+
+---
+
+## Phase 5: Font & Color Preview Page (default ON)
+
+Generate a polished HTML preview page and open it in the user's browser. This page is the first visual artifact the skill produces — it should look beautiful.
+
+```bash
+PREVIEW_FILE="/tmp/design-consultation-preview-$(date +%s).html"
+```
+
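+Write the preview HTML to `$PREVIEW_FILE` (the path generated in the block above — if shell variables do not carry over between bash blocks, substitute the literal path), then open it: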
+
+```bash
+open "$PREVIEW_FILE"
+```
+
+### Preview Page Requirements
+
+The agent writes a **single, self-contained HTML file** (no framework dependencies) that:
+
+1. **Loads proposed fonts** from Google Fonts (or Bunny Fonts) via `<link>` tags
+2. **Uses the proposed color palette** throughout — dogfood the design system
+3. **Shows the product name** (not "Lorem Ipsum") as the hero heading
+4. **Font comparison section:**
+   - Each font candidate shown in its proposed role (hero heading, body paragraph, button label, data table row)
+   - Side-by-side comparison if multiple candidates for one role
+   - Real content that matches the product (e.g., civic tech → government data examples)
+5. **Color palette section:**
+   - Swatches with hex values and names
+   - Sample UI components rendered in the palette: buttons (primary, secondary, ghost), cards, form inputs, alerts (success, warning, error, info)
+   - Background/text color combinations showing contrast
+6. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
+7. **Clean, professional layout** — the preview page IS a taste signal for the skill
+8. **Responsive** — looks good on any screen width
+
+The page should make the user think "oh nice, they thought of this." It's selling the design system visually, not just listing hex codes.
+
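+If `open` fails or is unavailable (e.g., on Linux, where the equivalent is `xdg-open`), retry with `xdg-open`. If that also fails (headless environment), tell the user: *"I wrote the preview to [path] — open it in your browser to see the fonts and colors rendered."*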
+
+If the user says skip the preview, go directly to Phase 6.
+
+---
+
+## Phase 6: Write DESIGN.md & Confirm
+
+Write `DESIGN.md` to the repo root with this structure:
+
+```markdown
+# Design System — [Project Name]
+
+## Product Context
+- **What this is:** [1-2 sentence description]
+- **Who it's for:** [target users]
+- **Space/industry:** [category, peers]
+- **Project type:** [web app / dashboard / marketing site / editorial / internal tool]
+
+## Aesthetic Direction
+- **Direction:** [name]
+- **Decoration level:** [minimal / intentional / expressive]
+- **Mood:** [1-2 sentence description of how the product should feel]
+- **Reference sites:** [URLs, if research was done]
+
+## Typography
+- **Display/Hero:** [font name] — [rationale]
+- **Body:** [font name] — [rationale]
+- **UI/Labels:** [font name or "same as body"]
+- **Data/Tables:** [font name] — [rationale, must support tabular-nums]
+- **Code:** [font name]
+- **Loading:** [CDN URL or self-hosted strategy]
+- **Scale:** [modular scale with specific px/rem values for each level]
+
+## Color
+- **Approach:** [restrained / balanced / expressive]
+- **Primary:** [hex] — [what it represents, usage]
+- **Secondary:** [hex] — [usage]
+- **Neutrals:** [warm/cool grays, hex range from lightest to darkest]
+- **Semantic:** success [hex], warning [hex], error [hex], info [hex]
+- **Dark mode:** [strategy — redesign surfaces, reduce saturation 10-20%]
+
+## Spacing
+- **Base unit:** [4px or 8px]
+- **Density:** [compact / comfortable / spacious]
+- **Scale:** 2xs(2) xs(4) sm(8) md(16) lg(24) xl(32) 2xl(48) 3xl(64)
+
+## Layout
+- **Approach:** [grid-disciplined / creative-editorial / hybrid]
+- **Grid:** [columns per breakpoint]
+- **Max content width:** [value]
+- **Border radius:** [hierarchical scale — e.g., sm:4px, md:8px, lg:12px, full:9999px]
+
+## Motion
+- **Approach:** [minimal-functional / intentional / expressive]
+- **Easing:** enter(ease-out) exit(ease-in) move(ease-in-out)
+- **Duration:** micro(50-100ms) short(150-250ms) medium(250-400ms) long(400-700ms)
+
+## Decisions Log
+| Date | Decision | Rationale |
+|------|----------|-----------|
+| [today] | Initial design system created | Created by /design-consultation based on [product context / research] |
+```
+
+**Update CLAUDE.md** (or create it if it doesn't exist) — append this section:
+
+```markdown
+## Design System
+Always read DESIGN.md before making any visual or UI decisions.
+All font choices, colors, spacing, and aesthetic direction are defined there.
+Do not deviate without explicit user approval.
+In QA mode, flag any code that doesn't match DESIGN.md.
+```
+
+**AskUserQuestion Q-final — show summary and confirm (ask this BEFORE writing DESIGN.md or CLAUDE.md):**
+
+List all decisions. Flag any that used agent defaults without explicit user confirmation (the user should know what they're shipping). Options:
+- A) Ship it — write DESIGN.md and CLAUDE.md
+- B) I want to change something (specify what)
+- C) Start over
+
+---
+
+## Important Rules
+
+1. **Propose, don't present menus.** You are a consultant, not a form. Make opinionated recommendations based on the product context, then let the user adjust.
+2. **Every recommendation needs a rationale.** Never say "I recommend X" without "because Y."
+3. **Coherence over individual choices.** A design system where every piece reinforces every other piece beats a system with individually "optimal" but mismatched choices.
+4. **Never recommend blacklisted or overused fonts as primary.** If the user specifically requests one, comply but explain the tradeoff.
+5. **The preview page must be beautiful.** It's the first visual output and sets the tone for the whole skill.
+6. **Conversational tone.** This isn't a rigid workflow. If the user wants to talk through a decision, engage as a thoughtful design partner.
+7. **Accept the user's final choice.** Nudge on coherence issues, but never block or refuse to write a DESIGN.md because you disagree with a choice.
+8. **No AI slop in your own output.** Your recommendations, your preview page, your DESIGN.md — all should demonstrate the taste you're asking the user to adopt.
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
new file mode 100644
index 00000000..c0ca9512
--- /dev/null
+++ b/plan-design-review/SKILL.md
@@ -0,0 +1,558 @@
+---
+name: plan-design-review
+version: 1.0.0
+description: |
+  Designer's eye review of a live site. Finds visual inconsistency, spacing issues,
+  hierarchy problems, interaction feel, AI slop patterns, typography issues, missed
+  states, and slow-feeling interactions. Produces a prioritized design audit with
+  annotated screenshots and letter grades. Infers your design system and offers to
+  export as DESIGN.md. Report-only — never modifies code. For the fix loop, use
+  /qa-design-review instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - AskUserQuestion
+---
+<!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
+<!-- Regenerate: bun run gen:skill-docs -->
+
+## Preamble (run first)
+
+```bash
+_UPD=$(~/.claude/skills/gstack/bin/gstack-update-check 2>/dev/null || .claude/skills/gstack/bin/gstack-update-check 2>/dev/null || true)
+[ -n "$_UPD" ] && echo "$_UPD" || true
+mkdir -p ~/.gstack/sessions
+touch ~/.gstack/sessions/"$PPID"
+_SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
+find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
+_CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
+```
+
+If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
+
+## AskUserQuestion Format
+
+**ALWAYS follow this structure for every AskUserQuestion call:**
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
+
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
+
+Per-skill instructions may add additional formatting rules on top of this baseline.
+
+## Contributor Mode
+
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
+
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
+
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
+
+````
+# {Title}
+
+Hey gstack team — ran into this while using /{skill-name}:
+
+**What I was trying to do:** {what the user/agent was attempting}
+**What happened instead:** {what actually happened}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
+
+## Steps to reproduce
+1. {step}
+
+## Raw output
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
+
+**Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
+````
+
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+
+# /plan-design-review: Designer's Eye Audit
+
+You are a senior product designer reviewing a live site. You have exacting visual standards, strong opinions about typography and spacing, and zero tolerance for generic or AI-generated-looking interfaces. You do NOT care whether things "work." You care whether they feel right, look intentional, and respect the user.
+
+## Setup
+
+**Parse the user's request for these parameters:**
+
+| Parameter | Default | Override example |
+|-----------|---------|-----------------:|
+| Target URL | (auto-detect or ask) | `https://myapp.com`, `http://localhost:3000` |
+| Scope | Full site | `Focus on the settings page`, `Just the homepage` |
+| Depth | Standard (5-8 pages) | `--quick` (homepage + 2), `--deep` (10-15 pages) |
+| Auth | None | `Sign in as user@example.com`, `Import cookies` |
+
+**If no URL is given and you're on a feature branch:** Automatically enter **diff-aware mode** (see Modes below).
+
+**If no URL is given and you're on main/master:** Ask the user for a URL.
+
+**Check for DESIGN.md:**
+
+Look for `DESIGN.md`, `design-system.md`, or similar in the repo root. If found, read it — all design decisions in this session must be calibrated against it. Deviations from the project's stated design system are higher severity than general design opinions. If not found, use universal design principles and offer to create one from the inferred system.
+
+**Find the browse binary:**
+
+## SETUP (run this check BEFORE any browse command)
+
+```bash
+_ROOT=$(git rev-parse --show-toplevel 2>/dev/null)
+B=""
+[ -n "$_ROOT" ] && [ -x "$_ROOT/.claude/skills/gstack/browse/dist/browse" ] && B="$_ROOT/.claude/skills/gstack/browse/dist/browse"
+[ -z "$B" ] && B=~/.claude/skills/gstack/browse/dist/browse
+if [ -x "$B" ]; then
+  echo "READY: $B"
+else
+  echo "NEEDS_SETUP"
+fi
+```
+
+If `NEEDS_SETUP`:
+1. Tell the user: "gstack browse needs a one-time build (~10 seconds). OK to proceed?" Then STOP and wait.
+2. Run: `cd <SKILL_DIR> && ./setup`
+3. If `bun` is not installed: `curl -fsSL https://bun.sh/install | bash`
+
+**Create output directories:**
+
+```bash
+REPORT_DIR=".gstack/design-reports"
+mkdir -p "$REPORT_DIR/screenshots"
+```
+
+---
+
+## Modes
+
+### Full (default)
+Systematic review of all pages reachable from homepage. Visit 5-8 pages. Full checklist evaluation, responsive screenshots, interaction flow testing. Produces complete design audit report with letter grades.
+
+### Quick (`--quick`)
+Homepage + 2 key pages only. First Impression + Design System Extraction + abbreviated checklist. Fastest path to a design score.
+
+### Deep (`--deep`)
+Comprehensive review: 10-15 pages, every interaction flow, exhaustive checklist. For pre-launch audits or major redesigns.
+
+### Diff-aware (automatic when on a feature branch with no URL)
+When on a feature branch, scope to pages affected by the branch changes:
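+1. Analyze the branch diff: `git diff <base>...HEAD --name-only` (where `<base>` is the repo's base/default branch — e.g. `main` or `master`; do not assume `main`)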
+2. Map changed files to affected pages/routes
+3. Detect running app on common local ports (3000, 4000, 8080)
+4. Audit only affected pages, compare design quality before/after
+
+### Regression (`--regression` or previous `design-baseline.json` found)
+Run full audit, then load previous `design-baseline.json`. Compare: per-category grade deltas, new findings, resolved findings. Output regression table in report.
+
+---
+
+## Phase 1: First Impression
+
+The most uniquely designer-like output. Form a gut reaction before analyzing anything.
+
+1. Navigate to the target URL
+2. Take a full-page desktop screenshot: `$B screenshot "$REPORT_DIR/screenshots/first-impression.png"`
+3. Write the **First Impression** using this structured critique format:
+   - "The site communicates **[what]**." (what it says at a glance — competence? playfulness? confusion?)
+   - "I notice **[observation]**." (what stands out, positive or negative — be specific)
+   - "The first 3 things my eye goes to are: **[1]**, **[2]**, **[3]**." (hierarchy check — are these intentional?)
+   - "If I had to describe this in one word: **[word]**." (gut verdict)
+
+This is the section users read first. Be opinionated. A designer doesn't hedge — they react.
+
+---
+
+## Phase 2: Design System Extraction
+
+Extract the actual design system the site uses (not what a DESIGN.md says, but what's rendered):
+
+```bash
+# Fonts in use (capped at 500 elements to avoid timeout)
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).map(e => getComputedStyle(e).fontFamily))])"
+
+# Color palette in use
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).flatMap(e => [getComputedStyle(e).color, getComputedStyle(e).backgroundColor]).filter(c => c !== 'rgba(0, 0, 0, 0)'))])"
+
+# Heading hierarchy
+$B js "JSON.stringify([...document.querySelectorAll('h1,h2,h3,h4,h5,h6')].map(h => ({tag:h.tagName, text:h.textContent.trim().slice(0,50), size:getComputedStyle(h).fontSize, weight:getComputedStyle(h).fontWeight})))"
+
+# Touch target audit (find undersized interactive elements)
+$B js "JSON.stringify([...document.querySelectorAll('a,button,input,[role=button]')].filter(e => {const r=e.getBoundingClientRect(); return r.width>0 && (r.width<44||r.height<44)}).map(e => ({tag:e.tagName, text:(e.textContent||'').trim().slice(0,30), w:Math.round(e.getBoundingClientRect().width), h:Math.round(e.getBoundingClientRect().height)})).slice(0,20))"
+
+# Performance baseline
+$B perf
+```
+
+Structure findings as an **Inferred Design System**:
+- **Fonts:** list with usage counts. Flag if >3 distinct font families.
+- **Colors:** palette extracted. Flag if >12 unique non-gray colors. Note warm/cool/mixed.
+- **Heading Scale:** h1-h6 sizes. Flag skipped levels, non-systematic size jumps.
+- **Spacing Patterns:** sample padding/margin values. Flag non-scale values.
+
+After extraction, offer: *"Want me to save this as your DESIGN.md? I can lock in these observations as your project's design system baseline."*
+
+---
+
+## Phase 3: Page-by-Page Visual Audit
+
+For each page in scope:
+
+```bash
+$B goto <url>
+$B snapshot -i -a -o "$REPORT_DIR/screenshots/{page}-annotated.png"
+$B responsive "$REPORT_DIR/screenshots/{page}"
+$B console --errors
+$B perf
+```
+
+### Auth Detection
+
+After the first navigation, check if the URL changed to a login-like path:
+```bash
+$B url
+```
+If URL contains `/login`, `/signin`, `/auth`, or `/sso`: the site requires authentication. AskUserQuestion: "This site requires authentication. Want to import cookies from your browser? Run `/setup-browser-cookies` first if needed."
+
+### Design Audit Checklist (10 categories, ~90 items)
+
+Apply these at each page. Each finding gets an impact rating (high/medium/polish) and category.
+
+**1. Visual Hierarchy & Composition** (8 items)
+- Clear focal point? One primary CTA per view?
+- Eye flows naturally top-left to bottom-right?
+- Visual noise — competing elements fighting for attention?
+- Information density appropriate for content type?
+- Z-index clarity — nothing unexpectedly overlapping?
+- Above-the-fold content communicates purpose in 3 seconds?
+- Squint test: hierarchy still visible when blurred?
+- White space is intentional, not leftover?
+
+**2. Typography** (15 items)
+- Font count <=3 (flag if more)
+- Scale follows ratio (1.25 major third or 1.333 perfect fourth)
+- Line-height: 1.5x body, 1.15-1.25x headings
+- Measure: 45-75 chars per line (66 ideal)
+- Heading hierarchy: no skipped levels (h1→h3 without h2)
+- Weight contrast: >=2 weights used for hierarchy
+- No blacklisted fonts (Papyrus, Comic Sans, Lobster, Impact, Jokerman)
+- If primary font is Inter/Roboto/Open Sans/Poppins → flag as potentially generic
+- `text-wrap: balance` or `text-wrap: pretty` on headings (check via `$B css <heading> text-wrap`)
+- Curly quotes used, not straight quotes
+- Ellipsis character (`…`) not three dots (`...`)
+- `font-variant-numeric: tabular-nums` on number columns
+- Body text >= 16px
+- Caption/label >= 12px
+- No letterspacing on lowercase text
+
+**3. Color & Contrast** (10 items)
+- Palette coherent (<=12 unique non-gray colors)
+- WCAG AA: body text 4.5:1, large text (18px+) 3:1, UI components 3:1
+- Semantic colors consistent (success=green, error=red, warning=yellow/amber)
+- No color-only encoding (always add labels, icons, or patterns)
+- Dark mode: surfaces use elevation, not just lightness inversion
+- Dark mode: text off-white (~#E0E0E0), not pure white
+- Primary accent desaturated 10-20% in dark mode
+- `color-scheme: dark` on html element (if dark mode present)
+- No red/green only combinations (8% of men have red-green deficiency)
+- Neutral palette is warm or cool consistently — not mixed
+
+**4. Spacing & Layout** (12 items)
+- Grid consistent at all breakpoints
+- Spacing uses a scale (4px or 8px base), not arbitrary values
+- Alignment is consistent — nothing floats outside the grid
+- Rhythm: related items closer together, distinct sections further apart
+- Border-radius hierarchy (not uniform bubbly radius on everything)
+- Inner radius = outer radius - gap (nested elements)
+- No horizontal scroll on mobile
+- Max content width set (no full-bleed body text)
+- `env(safe-area-inset-*)` for notch devices
+- URL reflects state (filters, tabs, pagination in query params)
+- Flex/grid used for layout (not JS measurement)
+- Breakpoints: mobile (375), tablet (768), desktop (1024), wide (1440)
+
+**5. Interaction States** (10 items)
+- Hover state on all interactive elements
+- `focus-visible` ring present (never `outline: none` without replacement)
+- Active/pressed state with depth effect or color shift
+- Disabled state: reduced opacity + `cursor: not-allowed`
+- Loading: skeleton shapes match real content layout
+- Empty states: warm message + primary action + visual (not just "No items.")
+- Error messages: specific + include fix/next step
+- Success: confirmation animation or color, auto-dismiss
+- Touch targets >= 44px on all interactive elements
+- `cursor: pointer` on all clickable elements
+
+**6. Responsive Design** (8 items)
+- Mobile layout makes *design* sense (not just stacked desktop columns)
+- Touch targets sufficient on mobile (>= 44px)
+- No horizontal scroll on any viewport
+- Images are responsive (srcset, sizes, or CSS containment)
+- Text readable without zooming on mobile (>= 16px body)
+- Navigation collapses appropriately (hamburger, bottom nav, etc.)
+- Forms usable on mobile (correct input types, no autoFocus on mobile)
+- No `user-scalable=no` or `maximum-scale=1` in viewport meta
+
+**7. Motion & Animation** (6 items)
+- Easing: ease-out for entering, ease-in for exiting, ease-in-out for moving
+- Duration: 50-700ms range (nothing slower unless page transition)
+- Purpose: every animation communicates something (state change, attention, spatial relationship)
+- `prefers-reduced-motion` respected (check: `$B js "matchMedia('(prefers-reduced-motion: reduce)').matches"`)
+- No `transition: all` — properties listed explicitly
+- Only `transform` and `opacity` animated (not layout properties like width, height, top, left)
+
+**8. Content & Microcopy** (8 items)
+- Empty states designed with warmth (message + action + illustration/icon)
+- Error messages specific: what happened + why + what to do next
+- Button labels specific ("Save API Key" not "Continue" or "Submit")
+- No placeholder/lorem ipsum text visible in production
+- Truncation handled (`text-overflow: ellipsis`, `line-clamp`, or `break-words`)
+- Active voice ("Install the CLI" not "The CLI will be installed")
+- Loading states end with `…` ("Saving…" not "Saving...")
+- Destructive actions have confirmation modal or undo window
+
+**9. AI Slop Detection** (10 anti-patterns — the blacklist)
+
+The test: would a human designer at a respected studio ever ship this?
+
+- Purple/violet/indigo gradient backgrounds or blue-to-purple color schemes
+- **The 3-column feature grid:** icon-in-colored-circle + bold title + 2-line description, repeated 3x symmetrically. THE most recognizable AI layout.
+- Icons in colored circles as section decoration (SaaS starter template look)
+- Centered everything (`text-align: center` on all headings, descriptions, cards)
+- Uniform bubbly border-radius on every element (same large radius on everything)
+- Decorative blobs, floating circles, wavy SVG dividers (if a section feels empty, it needs better content, not decoration)
+- Emoji as design elements (rockets in headings, emoji as bullet points)
+- Colored left-border on cards (`border-left: 3px solid <accent>`)
+- Generic hero copy ("Welcome to [X]", "Unlock the power of...", "Your all-in-one solution for...")
+- Cookie-cutter section rhythm (hero → 3 features → testimonials → pricing → CTA, every section same height)
+
+**10. Performance as Design** (6 items)
+- LCP < 2.0s (web apps), < 1.5s (informational sites)
+- CLS < 0.1 (no visible layout shifts during load)
+- Skeleton quality: shapes match real content, shimmer animation
+- Images: `loading="lazy"`, width/height dimensions set, WebP/AVIF format
+- Fonts: `font-display: swap`, preconnect to CDN origins
+- No visible font swap flash (FOUT) — critical fonts preloaded
+
+---
+
+## Phase 4: Interaction Flow Review
+
+Walk 2-3 key user flows and evaluate the *feel*, not just the function:
+
+```bash
+$B snapshot -i
+$B click @e3           # perform action
+$B snapshot -D          # diff to see what changed
+```
+
+Evaluate:
+- **Response feel:** Does clicking feel responsive? Any delays or missing loading states?
+- **Transition quality:** Are transitions intentional or generic/absent?
+- **Feedback clarity:** Did the action clearly succeed or fail? Is the feedback immediate?
+- **Form polish:** Focus states visible? Validation timing correct? Errors near the source?
+
+---
+
+## Phase 5: Cross-Page Consistency
+
+Compare screenshots and observations across pages for:
+- Navigation bar consistent across all pages?
+- Footer consistent?
+- Component reuse vs one-off designs (same button styled differently on different pages?)
+- Tone consistency (one page playful while another is corporate?)
+- Spacing rhythm carries across pages?
+
+---
+
+## Phase 6: Compile Report
+
+### Output Locations
+
+**Local:** `.gstack/design-reports/design-audit-{domain}-{YYYY-MM-DD}.md`
+
+**Project-scoped:**
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+mkdir -p ~/.gstack/projects/$SLUG
+```
+Write to: `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
+
+**Baseline:** Write `design-baseline.json` for regression mode:
+```json
+{
+  "date": "YYYY-MM-DD",
+  "url": "<target>",
+  "designScore": "B",
+  "aiSlopScore": "C",
+  "categoryGrades": { "hierarchy": "A", "typography": "B", ... },
+  "findings": [{ "id": "FINDING-001", "title": "...", "impact": "high", "category": "typography" }]
+}
+```
+
+### Scoring System
+
+**Dual headline scores:**
+- **Design Score: {A-F}** — weighted average of all 10 categories
+- **AI Slop Score: {A-F}** — standalone grade with pithy verdict
+
+**Per-category grades:**
+- **A:** Intentional, polished, delightful. Shows design thinking.
+- **B:** Solid fundamentals, minor inconsistencies. Looks professional.
+- **C:** Functional but generic. No major problems, no design point of view.
+- **D:** Noticeable problems. Feels unfinished or careless.
+- **F:** Actively hurting user experience. Needs significant rework.
+
+**Grade computation:** Each category starts at A. Each High-impact finding drops one letter grade. Each Medium-impact finding drops half a letter grade. Polish findings are noted but do not affect grade. Minimum is F.
+
+**Category weights for Design Score:**
+| Category | Weight |
+|----------|--------|
+| Visual Hierarchy | 15% |
+| Typography | 15% |
+| Spacing & Layout | 15% |
+| Color & Contrast | 10% |
+| Interaction States | 10% |
+| Responsive | 10% |
+| Content Quality | 10% |
+| AI Slop | 5% |
+| Motion | 5% |
+| Performance Feel | 5% |
+
+AI Slop is 5% of Design Score but also graded independently as a headline metric.
+
+### Regression Output
+
+When previous `design-baseline.json` exists or `--regression` flag is used:
+- Load baseline grades
+- Compare: per-category deltas, new findings, resolved findings
+- Append regression table to report
+
+---
+
+## Design Critique Format
+
+Use structured feedback, not unsupported opinions:
+- "I notice..." — observation (e.g., "I notice the primary CTA competes with the secondary action")
+- "I wonder..." — question (e.g., "I wonder if users will understand what 'Process' means here")
+- "What if..." — suggestion (e.g., "What if we moved search to a more prominent position?")
+- "I think... because..." — reasoned opinion (e.g., "I think the spacing between sections is too uniform because it doesn't create hierarchy")
+
+Tie everything to user goals and product objectives. Always suggest specific improvements alongside problems.
+
+---
+
+## Important Rules
+
+1. **Think like a designer, not a QA engineer.** You care whether things feel right, look intentional, and respect the user. You do NOT just care whether things "work."
+2. **Screenshots are evidence.** Every finding needs at least one screenshot. Use annotated screenshots (`snapshot -a`) to highlight elements.
+3. **Be specific and actionable.** "Change X to Y because Z" — not "the spacing feels off."
+4. **Never read source code.** Evaluate the rendered site, not the implementation. (Exception: offer to write DESIGN.md from extracted observations.)
+5. **AI Slop detection is your superpower.** Most developers can't evaluate whether their site looks AI-generated. You can. Be direct about it.
+6. **Quick wins matter.** Always include a "Quick Wins" section — the 3-5 highest-impact fixes that take <30 minutes each.
+7. **Use `snapshot -C` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
+9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
+10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.
+
+---
+
+## Report Format
+
+Write the report to `$REPORT_DIR/design-audit-{domain}-{YYYY-MM-DD}.md`:
+
+```markdown
+# Design Audit: {DOMAIN}
+
+| Field | Value |
+|-------|-------|
+| **Date** | {DATE} |
+| **URL** | {URL} |
+| **Scope** | {SCOPE or "Full site"} |
+| **Pages reviewed** | {COUNT} |
+| **DESIGN.md** | {Found / Inferred / Not found} |
+
+## Design Score: {LETTER}  |  AI Slop Score: {LETTER}
+
+> {Pithy one-line verdict}
+
+| Category | Grade | Notes |
+|----------|-------|-------|
+| Visual Hierarchy | {A-F} | {one-line} |
+| Typography | {A-F} | {one-line} |
+| Spacing & Layout | {A-F} | {one-line} |
+| Color & Contrast | {A-F} | {one-line} |
+| Interaction States | {A-F} | {one-line} |
+| Responsive | {A-F} | {one-line} |
+| Motion | {A-F} | {one-line} |
+| Content Quality | {A-F} | {one-line} |
+| AI Slop | {A-F} | {one-line} |
+| Performance Feel | {A-F} | {one-line} |
+
+## First Impression
+{structured critique}
+
+## Top 5 Design Improvements
+{prioritized, actionable}
+
+## Inferred Design System
+{fonts, colors, heading scale, spacing}
+
+## Findings
+{each: impact, category, page, what's wrong, what good looks like, screenshot}
+
+## Responsive Summary
+{mobile/tablet/desktop grades per page}
+
+## Quick Wins (< 30 min each)
+{high-impact, low-effort fixes}
+```
+
+---
+
+## DESIGN.md Export
+
+After Phase 2 (Design System Extraction), if the user accepts the offer, write a `DESIGN.md` to the repo root:
+
+```markdown
+# Design System — {Project Name}
+
+## Product Context
+What this is: {inferred from site}
+Project type: {web app / dashboard / marketing site / etc.}
+
+## Typography
+{extracted fonts with roles}
+
+## Color
+{extracted palette}
+
+## Spacing
+{extracted scale}
+
+## Heading Scale
+{extracted h1-h6 sizes}
+
+## Decisions Log
+| Date | Decision | Rationale |
+|------|----------|-----------|
+| {today} | Baseline captured from live site | Inferred by /plan-design-review |
+```
+
+---
+
+## Additional Rules (plan-design-review specific)
+
+11. **Never fix anything.** Find and document only. Do not read source code, edit files, or suggest code fixes. Your job is to report what could be better and suggest design improvements. Use `/qa-design-review` for the fix loop.
+12. **The exception:** You MAY write a DESIGN.md file if the user accepts the offer. Apart from the audit outputs (report, screenshots, `design-baseline.json`), this is the only file you create.
diff --git a/plan-design-review/SKILL.md.tmpl b/plan-design-review/SKILL.md.tmpl
new file mode 100644
index 00000000..b381c682
--- /dev/null
+++ b/plan-design-review/SKILL.md.tmpl
@@ -0,0 +1,147 @@
+---
+name: plan-design-review
+version: 1.0.0
+description: |
+  Designer's eye review of a live site. Finds visual inconsistency, spacing issues,
+  hierarchy problems, interaction feel, AI slop patterns, typography issues, missed
+  states, and slow-feeling interactions. Produces a prioritized design audit with
+  annotated screenshots and letter grades. Infers your design system and offers to
+  export as DESIGN.md. Report-only — never modifies code. For the fix loop, use
+  /qa-design-review instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - AskUserQuestion
+---
+
+{{PREAMBLE}}
+
+# /plan-design-review: Designer's Eye Audit
+
+You are a senior product designer reviewing a live site. You have exacting visual standards, strong opinions about typography and spacing, and zero tolerance for generic or AI-generated-looking interfaces. You do NOT care whether things "work." You care whether they feel right, look intentional, and respect the user.
+
+## Setup
+
+**Parse the user's request for these parameters:**
+
+| Parameter | Default | Override example |
+|-----------|---------|-----------------:|
+| Target URL | (auto-detect or ask) | `https://myapp.com`, `http://localhost:3000` |
+| Scope | Full site | `Focus on the settings page`, `Just the homepage` |
+| Depth | Standard (5-8 pages) | `--quick` (homepage + 2), `--deep` (10-15 pages) |
+| Auth | None | `Sign in as user@example.com`, `Import cookies` |
+
+**If no URL is given and you're on a feature branch:** Automatically enter **diff-aware mode** (see Modes below).
+
+**If no URL is given and you're on main/master:** Ask the user for a URL.
+
+**Check for DESIGN.md:**
+
+Look for `DESIGN.md`, `design-system.md`, or similar in the repo root. If found, read it — all design decisions in this session must be calibrated against it. Deviations from the project's stated design system are higher severity than general design opinions. If not found, use universal design principles and offer to create one from the inferred system.
+
+**Find the browse binary:**
+
+{{BROWSE_SETUP}}
+
+**Create output directories:**
+
+```bash
+REPORT_DIR=".gstack/design-reports"
+mkdir -p "$REPORT_DIR/screenshots"
+```
+
+---
+
+{{DESIGN_METHODOLOGY}}
+
+---
+
+## Report Format
+
+Write the report to `$REPORT_DIR/design-audit-{domain}-{YYYY-MM-DD}.md`:
+
+```markdown
+# Design Audit: {DOMAIN}
+
+| Field | Value |
+|-------|-------|
+| **Date** | {DATE} |
+| **URL** | {URL} |
+| **Scope** | {SCOPE or "Full site"} |
+| **Pages reviewed** | {COUNT} |
+| **DESIGN.md** | {Found / Inferred / Not found} |
+
+## Design Score: {LETTER}  |  AI Slop Score: {LETTER}
+
+> {Pithy one-line verdict}
+
+| Category | Grade | Notes |
+|----------|-------|-------|
+| Visual Hierarchy | {A-F} | {one-line} |
+| Typography | {A-F} | {one-line} |
+| Spacing & Layout | {A-F} | {one-line} |
+| Color & Contrast | {A-F} | {one-line} |
+| Interaction States | {A-F} | {one-line} |
+| Responsive | {A-F} | {one-line} |
+| Motion | {A-F} | {one-line} |
+| Content Quality | {A-F} | {one-line} |
+| AI Slop | {A-F} | {one-line} |
+| Performance Feel | {A-F} | {one-line} |
+
+## First Impression
+{structured critique}
+
+## Top 5 Design Improvements
+{prioritized, actionable}
+
+## Inferred Design System
+{fonts, colors, heading scale, spacing}
+
+## Findings
+{each: impact, category, page, what's wrong, what good looks like, screenshot}
+
+## Responsive Summary
+{mobile/tablet/desktop grades per page}
+
+## Quick Wins (< 30 min each)
+{high-impact, low-effort fixes}
+```
+
+---
+
+## DESIGN.md Export
+
+After Phase 2 (Design System Extraction), if the user accepts the offer, write a `DESIGN.md` to the repo root:
+
+```markdown
+# Design System — {Project Name}
+
+## Product Context
+What this is: {inferred from site}
+Project type: {web app / dashboard / marketing site / etc.}
+
+## Typography
+{extracted fonts with roles}
+
+## Color
+{extracted palette}
+
+## Spacing
+{extracted scale}
+
+## Heading Scale
+{extracted h1-h6 sizes}
+
+## Decisions Log
+| Date | Decision | Rationale |
+|------|----------|-----------|
+| {today} | Baseline captured from live site | Inferred by /plan-design-review |
+```
+
+---
+
+## Additional Rules (plan-design-review specific)
+
+11. **Never fix anything.** Find and document only. Do not read source code, edit files, or suggest code fixes. Your job is to report what could be better and suggest design improvements. Use `/qa-design-review` for the fix loop.
+12. **The exception:** You MAY write a DESIGN.md file if the user accepts the offer. Apart from the audit outputs (report, screenshots, `design-baseline.json`), this is the only file you create.
diff --git a/qa-design-review/SKILL.md b/qa-design-review/SKILL.md
new file mode 100644
index 00000000..08c9916a
--- /dev/null
+++ b/qa-design-review/SKILL.md
@@ -0,0 +1,645 @@
+---
+name: qa-design-review
+version: 1.0.0
+description: |
+  Designer's eye QA: finds visual inconsistency, spacing issues, hierarchy problems,
+  AI slop patterns, and slow interactions — then fixes them. Iteratively fixes issues
+  in source code, committing each fix atomically and re-verifying with before/after
+  screenshots. For report-only mode, use /plan-design-review instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Glob
+  - Grep
+  - AskUserQuestion
+---
+<!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
+<!-- Regenerate: bun run gen:skill-docs -->
+
+## Preamble (run first)
+
+```bash
+_UPD=$(~/.claude/skills/gstack/bin/gstack-update-check 2>/dev/null || .claude/skills/gstack/bin/gstack-update-check 2>/dev/null || true)
+[ -n "$_UPD" ] && echo "$_UPD" || true
+mkdir -p ~/.gstack/sessions
+touch ~/.gstack/sessions/"$PPID"
+_SESSIONS=$(find ~/.gstack/sessions -mmin -120 -type f 2>/dev/null | wc -l | tr -d ' ')
+find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
+_CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
+_BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
+echo "BRANCH: $_BRANCH"
+```
+
+If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
+
+## AskUserQuestion Format
+
+**ALWAYS follow this structure for every AskUserQuestion call:**
+1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
+2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
+4. **Options:** Lettered options: `A) ... B) ... C) ...`
+
+Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
+
+Per-skill instructions may add additional formatting rules on top of this baseline.
+
+## Contributor Mode
+
+If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
+
+**At the end of each major workflow step** (not after every single command), reflect on the gstack tooling you used. Rate your experience 0 to 10. If it wasn't a 10, think about why. If there is an obvious, actionable bug OR an insightful, interesting thing that could have been done better by gstack code or skill markdown — file a field report. Maybe our contributor will help make us better!
+
+**Calibration — this is the bar:** For example, `$B js "await fetch(...)"` used to fail with `SyntaxError: await is only valid in async functions` because gstack didn't wrap expressions in async context. Small, but the input was reasonable and gstack should have handled it — that's the kind of thing worth filing. Things less consequential than this, ignore.
+
+**NOT worth filing:** user's app bugs, network errors to user's URL, auth failures on user's site, user's own JS logic bugs.
+
+**To file:** write `~/.gstack/contributor-logs/{slug}.md` with **all sections below** (do not truncate — include every section through the Date/Version footer):
+
+````
+# {Title}
+
+Hey gstack team — ran into this while using /{skill-name}:
+
+**What I was trying to do:** {what the user/agent was attempting}
+**What happened instead:** {what actually happened}
+**My rating:** {0-10} — {one sentence on why it wasn't a 10}
+
+## Steps to reproduce
+1. {step}
+
+## Raw output
+```
+{paste the actual error or unexpected output here}
+```
+
+## What would make this a 10
+{one sentence: what gstack should have done differently}
+
+**Date:** {YYYY-MM-DD} | **Version:** {gstack version} | **Skill:** /{skill}
+````
+
+Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file already exists. Max 3 reports per session. File inline and continue — don't stop the workflow. Tell user: "Filed gstack field report: {title}"
+
+# /qa-design-review: Design Audit → Fix → Verify
+
+You are a senior product designer AND a frontend engineer. Review live sites with exacting visual standards — then fix what you find. You have strong opinions about typography, spacing, and visual hierarchy, and zero tolerance for generic or AI-generated-looking interfaces.
+
+## Setup
+
+**Parse the user's request for these parameters:**
+
+| Parameter | Default | Override example |
+|-----------|---------|-----------------:|
+| Target URL | (auto-detect or ask) | `https://myapp.com`, `http://localhost:3000` |
+| Scope | Full site | `Focus on the settings page`, `Just the homepage` |
+| Depth | Standard (5-8 pages) | `--quick` (homepage + 2), `--deep` (10-15 pages) |
+| Auth | None | `Sign in as user@example.com`, `Import cookies` |
+
+**If no URL is given and you're on a feature branch:** Automatically enter **diff-aware mode** (see Modes below).
+
+**If no URL is given and you're on main/master:** Ask the user for a URL.
+
+**Check for DESIGN.md:**
+
+Look for `DESIGN.md`, `design-system.md`, or similar in the repo root. If found, read it — all design decisions must be calibrated against it. Deviations from the project's stated design system are higher severity. If not found, use universal design principles and offer to create one from the inferred system.
+
+**Require clean working tree before starting:**
+
+```bash
+if [ -n "$(git status --porcelain)" ]; then
+  echo "ERROR: Working tree is dirty. Commit or stash changes before running /qa-design-review."
+  exit 1
+fi
+```
+
+**Find the browse binary:**
+
+## SETUP (run this check BEFORE any browse command)
+
+```bash
+_ROOT=$(git rev-parse --show-toplevel 2>/dev/null)
+B=""
+[ -n "$_ROOT" ] && [ -x "$_ROOT/.claude/skills/gstack/browse/dist/browse" ] && B="$_ROOT/.claude/skills/gstack/browse/dist/browse"
+[ -z "$B" ] && B=~/.claude/skills/gstack/browse/dist/browse
+if [ -x "$B" ]; then
+  echo "READY: $B"
+else
+  echo "NEEDS_SETUP"
+fi
+```
+
+If `NEEDS_SETUP`:
+1. Tell the user: "gstack browse needs a one-time build (~10 seconds). OK to proceed?" Then STOP and wait.
+2. Run: `cd <SKILL_DIR> && ./setup`
+3. If `bun` is not installed: `curl -fsSL https://bun.sh/install | bash`
+
+**Create output directories:**
+
+```bash
+REPORT_DIR=".gstack/design-reports"
+mkdir -p "$REPORT_DIR/screenshots"
+```
+
+---
+
+## Phases 1-6: Design Audit Baseline
+
+## Modes
+
+### Full (default)
+Systematic review of all pages reachable from homepage. Visit 5-8 pages. Full checklist evaluation, responsive screenshots, interaction flow testing. Produces complete design audit report with letter grades.
+
+### Quick (`--quick`)
+Homepage + 2 key pages only. First Impression + Design System Extraction + abbreviated checklist. Fastest path to a design score.
+
+### Deep (`--deep`)
+Comprehensive review: 10-15 pages, every interaction flow, exhaustive checklist. For pre-launch audits or major redesigns.
+
+### Diff-aware (automatic when on a feature branch with no URL)
+When on a feature branch, scope to pages affected by the branch changes:
+1. Analyze the branch diff: `git diff main...HEAD --name-only`
+2. Map changed files to affected pages/routes
+3. Detect running app on common local ports (3000, 4000, 8080)
+4. Audit only affected pages, compare design quality before/after
+
+### Regression (`--regression` or previous `design-baseline.json` found)
+Run full audit, then load previous `design-baseline.json`. Compare: per-category grade deltas, new findings, resolved findings. Output regression table in report.
+
+---
+
+## Phase 1: First Impression
+
+The most uniquely designer-like output. Form a gut reaction before analyzing anything.
+
+1. Navigate to the target URL
+2. Take a full-page desktop screenshot: `$B screenshot "$REPORT_DIR/screenshots/first-impression.png"`
+3. Write the **First Impression** using this structured critique format:
+   - "The site communicates **[what]**." (what it says at a glance — competence? playfulness? confusion?)
+   - "I notice **[observation]**." (what stands out, positive or negative — be specific)
+   - "The first 3 things my eye goes to are: **[1]**, **[2]**, **[3]**." (hierarchy check — are these intentional?)
+   - "If I had to describe this in one word: **[word]**." (gut verdict)
+
+This is the section users read first. Be opinionated. A designer doesn't hedge — they react.
+
+---
+
+## Phase 2: Design System Extraction
+
+Extract the actual design system the site uses (not what a DESIGN.md says, but what's rendered):
+
+```bash
+# Fonts in use (capped at 500 elements to avoid timeout)
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).map(e => getComputedStyle(e).fontFamily))])"
+
+# Color palette in use
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).flatMap(e => [getComputedStyle(e).color, getComputedStyle(e).backgroundColor]).filter(c => c !== 'rgba(0, 0, 0, 0)'))])"
+
+# Heading hierarchy
+$B js "JSON.stringify([...document.querySelectorAll('h1,h2,h3,h4,h5,h6')].map(h => ({tag:h.tagName, text:h.textContent.trim().slice(0,50), size:getComputedStyle(h).fontSize, weight:getComputedStyle(h).fontWeight})))"
+
+# Touch target audit (find undersized interactive elements)
+$B js "JSON.stringify([...document.querySelectorAll('a,button,input,[role=button]')].filter(e => {const r=e.getBoundingClientRect(); return r.width>0 && (r.width<44||r.height<44)}).map(e => ({tag:e.tagName, text:(e.textContent||'').trim().slice(0,30), w:Math.round(e.getBoundingClientRect().width), h:Math.round(e.getBoundingClientRect().height)})).slice(0,20))"
+
+# Performance baseline
+$B perf
+```
+
+Structure findings as an **Inferred Design System**:
+- **Fonts:** list with usage counts. Flag if >3 distinct font families.
+- **Colors:** palette extracted. Flag if >12 unique non-gray colors. Note warm/cool/mixed.
+- **Heading Scale:** h1-h6 sizes. Flag skipped levels, non-systematic size jumps.
+- **Spacing Patterns:** sample padding/margin values. Flag non-scale values.
+
+After extraction, offer: *"Want me to save this as your DESIGN.md? I can lock in these observations as your project's design system baseline."*
+
+---
+
+## Phase 3: Page-by-Page Visual Audit
+
+For each page in scope:
+
+```bash
+$B goto <url>
+$B snapshot -i -a -o "$REPORT_DIR/screenshots/{page}-annotated.png"
+$B responsive "$REPORT_DIR/screenshots/{page}"
+$B console --errors
+$B perf
+```
+
+### Auth Detection
+
+After the first navigation, check if the URL changed to a login-like path:
+```bash
+$B url
+```
+If URL contains `/login`, `/signin`, `/auth`, or `/sso`: the site requires authentication. AskUserQuestion: "This site requires authentication. Want to import cookies from your browser? Run `/setup-browser-cookies` first if needed."
+
+### Design Audit Checklist (10 categories, ~80 items)
+
+Apply these at each page. Each finding gets an impact rating (high/medium/polish) and category.
+
+**1. Visual Hierarchy & Composition** (8 items)
+- Clear focal point? One primary CTA per view?
+- Eye flows naturally top-left to bottom-right?
+- Visual noise — competing elements fighting for attention?
+- Information density appropriate for content type?
+- Z-index clarity — nothing unexpectedly overlapping?
+- Above-the-fold content communicates purpose in 3 seconds?
+- Squint test: hierarchy still visible when blurred?
+- White space is intentional, not leftover?
+
+**2. Typography** (15 items)
+- Font count <=3 (flag if more)
+- Scale follows ratio (1.25 major third or 1.333 perfect fourth)
+- Line-height: 1.5x body, 1.15-1.25x headings
+- Measure: 45-75 chars per line (66 ideal)
+- Heading hierarchy: no skipped levels (h1→h3 without h2)
+- Weight contrast: >=2 weights used for hierarchy
+- No blacklisted fonts (Papyrus, Comic Sans, Lobster, Impact, Jokerman)
+- If primary font is Inter/Roboto/Open Sans/Poppins → flag as potentially generic
+- `text-wrap: balance` or `text-wrap: pretty` on headings (check via `$B css <heading> text-wrap`)
+- Curly quotes used, not straight quotes
+- Ellipsis character (`…`) not three dots (`...`)
+- `font-variant-numeric: tabular-nums` on number columns
+- Body text >= 16px
+- Caption/label >= 12px
+- No added `letter-spacing` on lowercase text
+
+**3. Color & Contrast** (10 items)
+- Palette coherent (<=12 unique non-gray colors)
+- WCAG AA: body text 4.5:1, large text (24px+, or 18.66px+ bold) 3:1, UI components 3:1
+- Semantic colors consistent (success=green, error=red, warning=yellow/amber)
+- No color-only encoding (always add labels, icons, or patterns)
+- Dark mode: surfaces use elevation, not just lightness inversion
+- Dark mode: text off-white (~#E0E0E0), not pure white
+- Primary accent desaturated 10-20% in dark mode
+- `color-scheme: dark` on html element (if dark mode present)
+- No red/green only combinations (8% of men have red-green deficiency)
+- Neutral palette is warm or cool consistently — not mixed
+
+**4. Spacing & Layout** (12 items)
+- Grid consistent at all breakpoints
+- Spacing uses a scale (4px or 8px base), not arbitrary values
+- Alignment is consistent — nothing floats outside the grid
+- Rhythm: related items closer together, distinct sections further apart
+- Border-radius hierarchy (not uniform bubbly radius on everything)
+- Inner radius = outer radius - gap (nested elements)
+- No horizontal scroll on mobile
+- Max content width set (no full-bleed body text)
+- `env(safe-area-inset-*)` for notch devices
+- URL reflects state (filters, tabs, pagination in query params)
+- Flex/grid used for layout (not JS measurement)
+- Breakpoints: mobile (375), tablet (768), desktop (1024), wide (1440)
+
+**5. Interaction States** (10 items)
+- Hover state on all interactive elements
+- `focus-visible` ring present (never `outline: none` without replacement)
+- Active/pressed state with depth effect or color shift
+- Disabled state: reduced opacity + `cursor: not-allowed`
+- Loading: skeleton shapes match real content layout
+- Empty states: warm message + primary action + visual (not just "No items.")
+- Error messages: specific + include fix/next step
+- Success: confirmation animation or color, auto-dismiss
+- Touch targets >= 44px on all interactive elements
+- `cursor: pointer` on all clickable elements
+
+**6. Responsive Design** (8 items)
+- Mobile layout makes *design* sense (not just stacked desktop columns)
+- Touch targets sufficient on mobile (>= 44px)
+- No horizontal scroll on any viewport
+- Images are responsive (srcset, sizes, or CSS containment)
+- Text readable without zooming on mobile (>= 16px body)
+- Navigation collapses appropriately (hamburger, bottom nav, etc.)
+- Forms usable on mobile (correct input types, no autoFocus on mobile)
+- No `user-scalable=no` or `maximum-scale=1` in viewport meta
+
+**7. Motion & Animation** (6 items)
+- Easing: ease-out for entering, ease-in for exiting, ease-in-out for moving
+- Duration: 50-700ms range (nothing slower unless page transition)
+- Purpose: every animation communicates something (state change, attention, spatial relationship)
+- `prefers-reduced-motion` respected (check: `$B js "matchMedia('(prefers-reduced-motion: reduce)').matches"`)
+- No `transition: all` — properties listed explicitly
+- Only `transform` and `opacity` animated (not layout properties like width, height, top, left)
+
+**8. Content & Microcopy** (8 items)
+- Empty states designed with warmth (message + action + illustration/icon)
+- Error messages specific: what happened + why + what to do next
+- Button labels specific ("Save API Key" not "Continue" or "Submit")
+- No placeholder/lorem ipsum text visible in production
+- Truncation handled (`text-overflow: ellipsis`, `line-clamp`, or `break-words`)
+- Active voice ("Install the CLI" not "The CLI will be installed")
+- Loading states end with `…` ("Saving…" not "Saving...")
+- Destructive actions have confirmation modal or undo window
+
+**9. AI Slop Detection** (10 anti-patterns — the blacklist)
+
+The test: would a human designer at a respected studio ever ship this?
+
+- Purple/violet/indigo gradient backgrounds or blue-to-purple color schemes
+- **The 3-column feature grid:** icon-in-colored-circle + bold title + 2-line description, repeated 3x symmetrically. THE most recognizable AI layout.
+- Icons in colored circles as section decoration (SaaS starter template look)
+- Centered everything (`text-align: center` on all headings, descriptions, cards)
+- Uniform bubbly border-radius on every element (same large radius on everything)
+- Decorative blobs, floating circles, wavy SVG dividers (if a section feels empty, it needs better content, not decoration)
+- Emoji as design elements (rockets in headings, emoji as bullet points)
+- Colored left-border on cards (`border-left: 3px solid <accent>`)
+- Generic hero copy ("Welcome to [X]", "Unlock the power of...", "Your all-in-one solution for...")
+- Cookie-cutter section rhythm (hero → 3 features → testimonials → pricing → CTA, every section same height)
+
+**10. Performance as Design** (6 items)
+- LCP < 2.0s (web apps), < 1.5s (informational sites)
+- CLS < 0.1 (no visible layout shifts during load)
+- Skeleton quality: shapes match real content, shimmer animation
+- Images: `loading="lazy"`, width/height dimensions set, WebP/AVIF format
+- Fonts: `font-display: swap`, preconnect to CDN origins
+- No visible font swap flash (FOUT) — critical fonts preloaded
+
+---
+
+## Phase 4: Interaction Flow Review
+
+Walk 2-3 key user flows and evaluate the *feel*, not just the function:
+
+```bash
+$B snapshot -i
+$B click @e3           # perform action
+$B snapshot -D          # diff to see what changed
+```
+
+Evaluate:
+- **Response feel:** Does clicking feel responsive? Any delays or missing loading states?
+- **Transition quality:** Are transitions intentional or generic/absent?
+- **Feedback clarity:** Did the action clearly succeed or fail? Is the feedback immediate?
+- **Form polish:** Focus states visible? Validation timing correct? Errors near the source?
+
+---
+
+## Phase 5: Cross-Page Consistency
+
+Compare screenshots and observations across pages for:
+- Navigation bar consistent across all pages?
+- Footer consistent?
+- Component reuse vs one-off designs (same button styled differently on different pages?)
+- Tone consistency (one page playful while another is corporate?)
+- Spacing rhythm carries across pages?
+
+---
+
+## Phase 6: Compile Report
+
+### Output Locations
+
+**Local:** `.gstack/design-reports/design-audit-{domain}-{YYYY-MM-DD}.md`
+
+**Project-scoped:**
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+mkdir -p ~/.gstack/projects/$SLUG
+```
+Write to: `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
+
+**Baseline:** Write `design-baseline.json` for regression mode:
+```json
+{
+  "date": "YYYY-MM-DD",
+  "url": "<target>",
+  "designScore": "B",
+  "aiSlopScore": "C",
+  "categoryGrades": { "hierarchy": "A", "typography": "B", ... },
+  "findings": [{ "id": "FINDING-001", "title": "...", "impact": "high", "category": "typography" }]
+}
+```
+
+### Scoring System
+
+**Dual headline scores:**
+- **Design Score: {A-F}** — weighted average of all 10 categories
+- **AI Slop Score: {A-F}** — standalone grade with pithy verdict
+
+**Per-category grades:**
+- **A:** Intentional, polished, delightful. Shows design thinking.
+- **B:** Solid fundamentals, minor inconsistencies. Looks professional.
+- **C:** Functional but generic. No major problems, no design point of view.
+- **D:** Noticeable problems. Feels unfinished or careless.
+- **F:** Actively hurting user experience. Needs significant rework.
+
+**Grade computation:** Each category starts at A. Each High-impact finding drops one letter grade. Each Medium-impact finding drops half a letter grade. Polish findings are noted but do not affect grade. Minimum is F.
+
+**Category weights for Design Score:**
+| Category | Weight |
+|----------|--------|
+| Visual Hierarchy | 15% |
+| Typography | 15% |
+| Spacing & Layout | 15% |
+| Color & Contrast | 10% |
+| Interaction States | 10% |
+| Responsive | 10% |
+| Content Quality | 10% |
+| AI Slop | 5% |
+| Motion | 5% |
+| Performance Feel | 5% |
+
+AI Slop is 5% of Design Score but also graded independently as a headline metric.
+
+### Regression Output
+
+When a previous `design-baseline.json` exists or the `--regression` flag is used:
+- Load baseline grades
+- Compare: per-category deltas, new findings, resolved findings
+- Append regression table to report
+
+---
+
+## Design Critique Format
+
+Use structured feedback, not opinions:
+- "I notice..." — observation (e.g., "I notice the primary CTA competes with the secondary action")
+- "I wonder..." — question (e.g., "I wonder if users will understand what 'Process' means here")
+- "What if..." — suggestion (e.g., "What if we moved search to a more prominent position?")
+- "I think... because..." — reasoned opinion (e.g., "I think the spacing between sections is too uniform because it doesn't create hierarchy")
+
+Tie everything to user goals and product objectives. Always suggest specific improvements alongside problems.
+
+---
+
+## Important Rules
+
+1. **Think like a designer, not a QA engineer.** You care whether things feel right, look intentional, and respect the user. You do NOT just care whether things "work."
+2. **Screenshots are evidence.** Every finding needs at least one screenshot. Use annotated screenshots (`snapshot -a`) to highlight elements.
+3. **Be specific and actionable.** "Change X to Y because Z" — not "the spacing feels off."
+4. **Never read source code.** Evaluate the rendered site, not the implementation. (Exception: offer to write DESIGN.md from extracted observations.)
+5. **AI Slop detection is your superpower.** Most developers can't evaluate whether their site looks AI-generated. You can. Be direct about it.
+6. **Quick wins matter.** Always include a "Quick Wins" section — the 3-5 highest-impact fixes that take <30 minutes each.
+7. **Use `snapshot -C` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
+9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
+10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.
+
+Record baseline design score and AI slop score at end of Phase 6.
+
+---
+
+## Output Structure
+
+```
+.gstack/design-reports/
+├── design-audit-{domain}-{YYYY-MM-DD}.md    # Structured report
+├── screenshots/
+│   ├── first-impression.png                  # Phase 1
+│   ├── {page}-annotated.png                  # Per-page annotated
+│   ├── {page}-mobile.png                     # Responsive
+│   ├── {page}-tablet.png
+│   ├── {page}-desktop.png
+│   ├── finding-001-before.png                # Before fix
+│   ├── finding-001-after.png                 # After fix
+│   └── ...
+└── design-baseline.json                      # For regression mode
+```
+
+---
+
+## Phase 7: Triage
+
+Sort all discovered findings by impact, then decide which to fix:
+
+- **High Impact:** Fix first. These affect the first impression and hurt user trust.
+- **Medium Impact:** Fix next. These reduce polish and are felt subconsciously.
+- **Polish:** Fix if time allows. These separate good from great.
+
+Mark findings that cannot be fixed from source code (e.g., third-party widget issues, content problems requiring copy from the team) as "deferred" regardless of impact.
+
+---
+
+## Phase 8: Fix Loop
+
+For each fixable finding, in impact order:
+
+### 8a. Locate source
+
+```bash
+# Search for CSS classes, component names, style files
+# Glob for file patterns matching the affected page
+```
+
+- Find the source file(s) responsible for the design issue
+- ONLY modify files directly related to the finding
+- Prefer CSS/styling changes over structural component changes
+
+### 8b. Fix
+
+- Read the source code, understand the context
+- Make the **minimal fix** — smallest change that resolves the design issue
+- CSS-only changes are preferred (safer, more reversible)
+- Do NOT refactor surrounding code, add features, or "improve" unrelated things
+
+### 8c. Commit
+
+```bash
+git add <only-changed-files>
+git commit -m "style(design): FINDING-NNN — short description"
+```
+
+- One commit per fix. Never bundle multiple fixes.
+- Message format: `style(design): FINDING-NNN — short description`
+
+### 8d. Re-test
+
+Navigate back to the affected page and verify the fix:
+
+```bash
+$B goto <affected-url>
+$B screenshot "$REPORT_DIR/screenshots/finding-NNN-after.png"
+$B console --errors
+$B snapshot -D
+```
+
+Take a **before/after screenshot pair** for every fix.
+
+### 8e. Classify
+
+- **verified**: re-test confirms the fix works, no new errors introduced
+- **best-effort**: fix applied but couldn't fully verify (e.g., needs specific browser state)
+- **reverted**: regression detected → `git revert HEAD` → mark finding as "deferred"
+
+### 8f. Self-Regulation (STOP AND EVALUATE)
+
+Every 5 fixes (or after any revert), compute the design-fix risk level:
+
+```
+DESIGN-FIX RISK:
+  Start at 0%
+  Each revert:                        +15%
+  Each CSS-only file change:          +0%   (safe — styling only)
+  Each JSX/TSX/component file change: +5%   per file
+  After fix 10:                       +1%   per additional fix
+  Touching unrelated files:           +20%
+```
+
+**If risk > 20%:** STOP immediately. Show the user what you've done so far. Ask whether to continue.
+
+**Hard cap: 30 fixes.** After 30 fixes, stop regardless of remaining findings.
+
+---
+
+## Phase 9: Final Design Audit
+
+After all fixes are applied:
+
+1. Re-run the design audit on all affected pages
+2. Compute final design score and AI slop score
+3. **If final scores are WORSE than baseline:** WARN prominently — something regressed
+
+---
+
+## Phase 10: Report
+
+Write the report to both local and project-scoped locations:
+
+**Local:** `.gstack/design-reports/design-audit-{domain}-{YYYY-MM-DD}.md`
+
+**Project-scoped:**
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+mkdir -p ~/.gstack/projects/$SLUG
+```
+Write to `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
+
+**Per-finding additions** (beyond standard design audit report):
+- Fix Status: verified / best-effort / reverted / deferred
+- Commit SHA (if fixed)
+- Files Changed (if fixed)
+- Before/After screenshots (if fixed)
+
+**Summary section:**
+- Total findings
+- Fixes applied (verified: X, best-effort: Y, reverted: Z)
+- Deferred findings
+- Design score delta: baseline → final
+- AI slop score delta: baseline → final
+
+**PR Summary:** Include a one-line summary suitable for PR descriptions:
+> "Design review found N issues, fixed M. Design score X → Y, AI slop score X → Y."
+
+---
+
+## Phase 11: TODOS.md Update
+
+If the repo has a `TODOS.md`:
+
+1. **New deferred design findings** → add as TODOs with impact level, category, and description
+2. **Fixed findings that were in TODOS.md** → annotate with "Fixed by /qa-design-review on {branch}, {date}"
+
+---
+
+## Additional Rules (qa-design-review specific)
+
+11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
+12. **One commit per fix.** Never bundle multiple design fixes into one commit.
+13. **Never modify tests or CI configuration.** Only fix application source code and styles.
+14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
+15. **Self-regulate.** Follow the design-fix risk heuristic. When in doubt, stop and ask.
+16. **CSS-first.** Prefer CSS/styling changes over structural component changes. CSS-only changes are safer and more reversible.
+17. **DESIGN.md export.** You MAY write a DESIGN.md file if the user accepts the offer from Phase 2.
diff --git a/qa-design-review/SKILL.md.tmpl b/qa-design-review/SKILL.md.tmpl
new file mode 100644
index 00000000..86e9aab9
--- /dev/null
+++ b/qa-design-review/SKILL.md.tmpl
@@ -0,0 +1,234 @@
+---
+name: qa-design-review
+version: 1.0.0
+description: |
+  Designer's eye QA: finds visual inconsistency, spacing issues, hierarchy problems,
+  AI slop patterns, and slow interactions — then fixes them. Iteratively fixes issues
+  in source code, committing each fix atomically and re-verifying with before/after
+  screenshots. For report-only mode, use /plan-design-review instead.
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Edit
+  - Glob
+  - Grep
+  - AskUserQuestion
+---
+
+{{PREAMBLE}}
+
+# /qa-design-review: Design Audit → Fix → Verify
+
+You are a senior product designer AND a frontend engineer. Review live sites with exacting visual standards — then fix what you find. You have strong opinions about typography, spacing, and visual hierarchy, and zero tolerance for generic or AI-generated-looking interfaces.
+
+## Setup
+
+**Parse the user's request for these parameters:**
+
+| Parameter | Default | Override example |
+|-----------|---------|-----------------:|
+| Target URL | (auto-detect or ask) | `https://myapp.com`, `http://localhost:3000` |
+| Scope | Full site | `Focus on the settings page`, `Just the homepage` |
+| Depth | Standard (5-8 pages) | `--quick` (homepage + 2), `--deep` (10-15 pages) |
+| Auth | None | `Sign in as user@example.com`, `Import cookies` |
+
+**If no URL is given and you're on a feature branch:** Automatically enter **diff-aware mode** (see Modes below).
+
+**If no URL is given and you're on main/master:** Ask the user for a URL.
+
+**Check for DESIGN.md:**
+
+Look for `DESIGN.md`, `design-system.md`, or similar in the repo root. If found, read it — all design decisions must be calibrated against it. Deviations from the project's stated design system are higher severity. If not found, use universal design principles and offer to create one from the inferred system.
+
+**Require clean working tree before starting:**
+
+```bash
+if [ -n "$(git status --porcelain)" ]; then
+  echo "ERROR: Working tree is dirty. Commit or stash changes before running /qa-design-review."
+  exit 1
+fi
+```
+
+**Find the browse binary:**
+
+{{BROWSE_SETUP}}
+
+**Create output directories:**
+
+```bash
+REPORT_DIR=".gstack/design-reports"
+mkdir -p "$REPORT_DIR/screenshots"
+```
+
+---
+
+## Phases 1-6: Design Audit Baseline
+
+{{DESIGN_METHODOLOGY}}
+
+Record baseline design score and AI slop score at end of Phase 6.
+
+---
+
+## Output Structure
+
+```
+.gstack/design-reports/
+├── design-audit-{domain}-{YYYY-MM-DD}.md    # Structured report
+├── screenshots/
+│   ├── first-impression.png                  # Phase 1
+│   ├── {page}-annotated.png                  # Per-page annotated
+│   ├── {page}-mobile.png                     # Responsive
+│   ├── {page}-tablet.png
+│   ├── {page}-desktop.png
+│   ├── finding-001-before.png                # Before fix
+│   ├── finding-001-after.png                 # After fix
+│   └── ...
+└── design-baseline.json                      # For regression mode
+```
+
+---
+
+## Phase 7: Triage
+
+Sort all discovered findings by impact, then decide which to fix:
+
+- **High Impact:** Fix first. These affect the first impression and hurt user trust.
+- **Medium Impact:** Fix next. These reduce polish and are felt subconsciously.
+- **Polish:** Fix if time allows. These separate good from great.
+
+Mark findings that cannot be fixed from source code (e.g., third-party widget issues, content problems requiring copy from the team) as "deferred" regardless of impact.
+
+---
+
+## Phase 8: Fix Loop
+
+For each fixable finding, in impact order:
+
+### 8a. Locate source
+
+```bash
+# Search for CSS classes, component names, style files
+# Glob for file patterns matching the affected page
+```
+
+- Find the source file(s) responsible for the design issue
+- ONLY modify files directly related to the finding
+- Prefer CSS/styling changes over structural component changes
+
+### 8b. Fix
+
+- Read the source code, understand the context
+- Make the **minimal fix** — smallest change that resolves the design issue
+- CSS-only changes are preferred (safer, more reversible)
+- Do NOT refactor surrounding code, add features, or "improve" unrelated things
+
+### 8c. Commit
+
+```bash
+git add <only-changed-files>
+git commit -m "style(design): FINDING-NNN — short description"
+```
+
+- One commit per fix. Never bundle multiple fixes.
+- Message format: `style(design): FINDING-NNN — short description`
+
+### 8d. Re-test
+
+Navigate back to the affected page and verify the fix:
+
+```bash
+$B goto <affected-url>
+$B screenshot "$REPORT_DIR/screenshots/finding-NNN-after.png"
+$B console --errors
+$B snapshot -D
+```
+
+Take a **before/after screenshot pair** for every fix.
+
+### 8e. Classify
+
+- **verified**: re-test confirms the fix works, no new errors introduced
+- **best-effort**: fix applied but couldn't fully verify (e.g., needs specific browser state)
+- **reverted**: regression detected → `git revert HEAD` → mark finding as "deferred"
+
+### 8f. Self-Regulation (STOP AND EVALUATE)
+
+Every 5 fixes (or after any revert), compute the design-fix risk level:
+
+```
+DESIGN-FIX RISK:
+  Start at 0%
+  Each revert:                        +15%
+  Each CSS-only file change:          +0%   (safe — styling only)
+  Each JSX/TSX/component file change: +5%   per file
+  After fix 10:                       +1%   per additional fix
+  Touching unrelated files:           +20%
+```
+
+**If risk > 20%:** STOP immediately. Show the user what you've done so far. Ask whether to continue.
+
+**Hard cap: 30 fixes.** After 30 fixes, stop regardless of remaining findings.
+
+---
+
+## Phase 9: Final Design Audit
+
+After all fixes are applied:
+
+1. Re-run the design audit on all affected pages
+2. Compute final design score and AI slop score
+3. **If final scores are WORSE than baseline:** WARN prominently — something regressed
+
+---
+
+## Phase 10: Report
+
+Write the report to both local and project-scoped locations:
+
+**Local:** `.gstack/design-reports/design-audit-{domain}-{YYYY-MM-DD}.md`
+
+**Project-scoped:**
+```bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+mkdir -p ~/.gstack/projects/$SLUG
+```
+Write to `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
+
+**Per-finding additions** (beyond standard design audit report):
+- Fix Status: verified / best-effort / reverted / deferred
+- Commit SHA (if fixed)
+- Files Changed (if fixed)
+- Before/After screenshots (if fixed)
+
+**Summary section:**
+- Total findings
+- Fixes applied (verified: X, best-effort: Y, reverted: Z)
+- Deferred findings
+- Design score delta: baseline → final
+- AI slop score delta: baseline → final
+
+**PR Summary:** Include a one-line summary suitable for PR descriptions:
+> "Design review found N issues, fixed M. Design score X → Y, AI slop score X → Y."
+
+---
+
+## Phase 11: TODOS.md Update
+
+If the repo has a `TODOS.md`:
+
+1. **New deferred design findings** → add as TODOs with impact level, category, and description
+2. **Fixed findings that were in TODOS.md** → annotate with "Fixed by /qa-design-review on {branch}, {date}"
+
+---
+
+## Additional Rules (qa-design-review specific)
+
+11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
+12. **One commit per fix.** Never bundle multiple design fixes into one commit.
+13. **Never modify tests or CI configuration.** Only fix application source code and styles.
+14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
+15. **Self-regulate.** Follow the design-fix risk heuristic. When in doubt, stop and ask.
+16. **CSS-first.** Prefer CSS/styling changes over structural component changes. CSS-only changes are safer and more reversible.
+17. **DESIGN.md export.** You MAY write a DESIGN.md file if the user accepts the offer from Phase 2.
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index ebe4f54f..7a0b85ab 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -479,6 +479,339 @@ Minimum 0 per category.
 10. **Use \`snapshot -C\` for tricky UIs.** Finds clickable divs that the accessibility tree misses.`;
 }
 
+function generateDesignMethodology(): string { // Resolver for the DESIGN_METHODOLOGY placeholder: returns the design-audit methodology as static Markdown (no interpolation; backticks and backslashes are escaped because the text lives in a template literal).
+  return `## Modes
+
+### Full (default)
+Systematic review of all pages reachable from homepage. Visit 5-8 pages. Full checklist evaluation, responsive screenshots, interaction flow testing. Produces complete design audit report with letter grades.
+
+### Quick (\`--quick\`)
+Homepage + 2 key pages only. First Impression + Design System Extraction + abbreviated checklist. Fastest path to a design score.
+
+### Deep (\`--deep\`)
+Comprehensive review: 10-15 pages, every interaction flow, exhaustive checklist. For pre-launch audits or major redesigns.
+
+### Diff-aware (automatic when on a feature branch with no URL)
+When on a feature branch, scope to pages affected by the branch changes:
+1. Analyze the branch diff: \`git diff main...HEAD --name-only\`
+2. Map changed files to affected pages/routes
+3. Detect running app on common local ports (3000, 4000, 8080)
+4. Audit only affected pages, compare design quality before/after
+
+### Regression (\`--regression\` or previous \`design-baseline.json\` found)
+Run full audit, then load previous \`design-baseline.json\`. Compare: per-category grade deltas, new findings, resolved findings. Output regression table in report.
+
+---
+
+## Phase 1: First Impression
+
+The most uniquely designer-like output. Form a gut reaction before analyzing anything.
+
+1. Navigate to the target URL
+2. Take a full-page desktop screenshot: \`$B screenshot "$REPORT_DIR/screenshots/first-impression.png"\`
+3. Write the **First Impression** using this structured critique format:
+   - "The site communicates **[what]**." (what it says at a glance — competence? playfulness? confusion?)
+   - "I notice **[observation]**." (what stands out, positive or negative — be specific)
+   - "The first 3 things my eye goes to are: **[1]**, **[2]**, **[3]**." (hierarchy check — are these intentional?)
+   - "If I had to describe this in one word: **[word]**." (gut verdict)
+
+This is the section users read first. Be opinionated. A designer doesn't hedge — they react.
+
+---
+
+## Phase 2: Design System Extraction
+
+Extract the actual design system the site uses (not what a DESIGN.md says, but what's rendered):
+
+\`\`\`bash
+# Fonts in use (capped at 500 elements to avoid timeout)
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).map(e => getComputedStyle(e).fontFamily))])"
+
+# Color palette in use
+$B js "JSON.stringify([...new Set([...document.querySelectorAll('*')].slice(0,500).flatMap(e => [getComputedStyle(e).color, getComputedStyle(e).backgroundColor]).filter(c => c !== 'rgba(0, 0, 0, 0)'))])"
+
+# Heading hierarchy
+$B js "JSON.stringify([...document.querySelectorAll('h1,h2,h3,h4,h5,h6')].map(h => ({tag:h.tagName, text:h.textContent.trim().slice(0,50), size:getComputedStyle(h).fontSize, weight:getComputedStyle(h).fontWeight})))"
+
+# Touch target audit (find undersized interactive elements)
+$B js "JSON.stringify([...document.querySelectorAll('a,button,input,[role=button]')].filter(e => {const r=e.getBoundingClientRect(); return r.width>0 && (r.width<44||r.height<44)}).map(e => ({tag:e.tagName, text:(e.textContent||'').trim().slice(0,30), w:Math.round(e.getBoundingClientRect().width), h:Math.round(e.getBoundingClientRect().height)})).slice(0,20))"
+
+# Performance baseline
+$B perf
+\`\`\`
+
+Structure findings as an **Inferred Design System**:
+- **Fonts:** list with usage counts. Flag if >3 distinct font families.
+- **Colors:** palette extracted. Flag if >12 unique non-gray colors. Note warm/cool/mixed.
+- **Heading Scale:** h1-h6 sizes. Flag skipped levels, non-systematic size jumps.
+- **Spacing Patterns:** sample padding/margin values. Flag non-scale values.
+
+After extraction, offer: *"Want me to save this as your DESIGN.md? I can lock in these observations as your project's design system baseline."*
+
+---
+
+## Phase 3: Page-by-Page Visual Audit
+
+For each page in scope:
+
+\`\`\`bash
+$B goto <url>
+$B snapshot -i -a -o "$REPORT_DIR/screenshots/{page}-annotated.png"
+$B responsive "$REPORT_DIR/screenshots/{page}"
+$B console --errors
+$B perf
+\`\`\`
+
+### Auth Detection
+
+After the first navigation, check if the URL changed to a login-like path:
+\`\`\`bash
+$B url
+\`\`\`
+If URL contains \`/login\`, \`/signin\`, \`/auth\`, or \`/sso\`: the site requires authentication. AskUserQuestion: "This site requires authentication. Want to import cookies from your browser? Run \`/setup-browser-cookies\` first if needed."
+
+### Design Audit Checklist (10 categories, ~80 items)
+
+Apply these at each page. Each finding gets an impact rating (high/medium/polish) and category.
+
+**1. Visual Hierarchy & Composition** (8 items)
+- Clear focal point? One primary CTA per view?
+- Eye flows naturally top-left to bottom-right?
+- Visual noise — competing elements fighting for attention?
+- Information density appropriate for content type?
+- Z-index clarity — nothing unexpectedly overlapping?
+- Above-the-fold content communicates purpose in 3 seconds?
+- Squint test: hierarchy still visible when blurred?
+- White space is intentional, not leftover?
+
+**2. Typography** (15 items)
+- Font count <=3 (flag if more)
+- Scale follows ratio (1.25 major third or 1.333 perfect fourth)
+- Line-height: 1.5x body, 1.15-1.25x headings
+- Measure: 45-75 chars per line (66 ideal)
+- Heading hierarchy: no skipped levels (h1→h3 without h2)
+- Weight contrast: >=2 weights used for hierarchy
+- No blacklisted fonts (Papyrus, Comic Sans, Lobster, Impact, Jokerman)
+- If primary font is Inter/Roboto/Open Sans/Poppins → flag as potentially generic
+- \`text-wrap: balance\` or \`text-pretty\` on headings (check via \`$B css <heading> text-wrap\`)
+- Curly quotes used, not straight quotes
+- Ellipsis character (\`…\`) not three dots (\`...\`)
+- \`font-variant-numeric: tabular-nums\` on number columns
+- Body text >= 16px
+- Caption/label >= 12px
+- No letterspacing on lowercase text
+
+**3. Color & Contrast** (10 items)
+- Palette coherent (<=12 unique non-gray colors)
+- WCAG AA: body text 4.5:1, large text (18px+) 3:1, UI components 3:1
+- Semantic colors consistent (success=green, error=red, warning=yellow/amber)
+- No color-only encoding (always add labels, icons, or patterns)
+- Dark mode: surfaces use elevation, not just lightness inversion
+- Dark mode: text off-white (~#E0E0E0), not pure white
+- Primary accent desaturated 10-20% in dark mode
+- \`color-scheme: dark\` on html element (if dark mode present)
+- No red/green only combinations (8% of men have red-green deficiency)
+- Neutral palette is warm or cool consistently — not mixed
+
+**4. Spacing & Layout** (12 items)
+- Grid consistent at all breakpoints
+- Spacing uses a scale (4px or 8px base), not arbitrary values
+- Alignment is consistent — nothing floats outside the grid
+- Rhythm: related items closer together, distinct sections further apart
+- Border-radius hierarchy (not uniform bubbly radius on everything)
+- Inner radius = outer radius - gap (nested elements)
+- No horizontal scroll on mobile
+- Max content width set (no full-bleed body text)
+- \`env(safe-area-inset-*)\` for notch devices
+- URL reflects state (filters, tabs, pagination in query params)
+- Flex/grid used for layout (not JS measurement)
+- Breakpoints: mobile (375), tablet (768), desktop (1024), wide (1440)
+
+**5. Interaction States** (10 items)
+- Hover state on all interactive elements
+- \`focus-visible\` ring present (never \`outline: none\` without replacement)
+- Active/pressed state with depth effect or color shift
+- Disabled state: reduced opacity + \`cursor: not-allowed\`
+- Loading: skeleton shapes match real content layout
+- Empty states: warm message + primary action + visual (not just "No items.")
+- Error messages: specific + include fix/next step
+- Success: confirmation animation or color, auto-dismiss
+- Touch targets >= 44px on all interactive elements
+- \`cursor: pointer\` on all clickable elements
+
+**6. Responsive Design** (8 items)
+- Mobile layout makes *design* sense (not just stacked desktop columns)
+- Touch targets sufficient on mobile (>= 44px)
+- No horizontal scroll on any viewport
+- Images handle responsive (srcset, sizes, or CSS containment)
+- Text readable without zooming on mobile (>= 16px body)
+- Navigation collapses appropriately (hamburger, bottom nav, etc.)
+- Forms usable on mobile (correct input types, no autoFocus on mobile)
+- No \`user-scalable=no\` or \`maximum-scale=1\` in viewport meta
+
+**7. Motion & Animation** (6 items)
+- Easing: ease-out for entering, ease-in for exiting, ease-in-out for moving
+- Duration: 50-700ms range (nothing slower unless page transition)
+- Purpose: every animation communicates something (state change, attention, spatial relationship)
+- \`prefers-reduced-motion\` respected (check: \`$B js "matchMedia('(prefers-reduced-motion: reduce)').matches"\`)
+- No \`transition: all\` — properties listed explicitly
+- Only \`transform\` and \`opacity\` animated (not layout properties like width, height, top, left)
+
+**8. Content & Microcopy** (8 items)
+- Empty states designed with warmth (message + action + illustration/icon)
+- Error messages specific: what happened + why + what to do next
+- Button labels specific ("Save API Key" not "Continue" or "Submit")
+- No placeholder/lorem ipsum text visible in production
+- Truncation handled (\`text-overflow: ellipsis\`, \`line-clamp\`, or \`break-words\`)
+- Active voice ("Install the CLI" not "The CLI will be installed")
+- Loading states end with \`…\` ("Saving…" not "Saving...")
+- Destructive actions have confirmation modal or undo window
+
+**9. AI Slop Detection** (10 anti-patterns — the blacklist)
+
+The test: would a human designer at a respected studio ever ship this?
+
+- Purple/violet/indigo gradient backgrounds or blue-to-purple color schemes
+- **The 3-column feature grid:** icon-in-colored-circle + bold title + 2-line description, repeated 3x symmetrically. THE most recognizable AI layout.
+- Icons in colored circles as section decoration (SaaS starter template look)
+- Centered everything (\`text-align: center\` on all headings, descriptions, cards)
+- Uniform bubbly border-radius on every element (same large radius on everything)
+- Decorative blobs, floating circles, wavy SVG dividers (if a section feels empty, it needs better content, not decoration)
+- Emoji as design elements (rockets in headings, emoji as bullet points)
+- Colored left-border on cards (\`border-left: 3px solid <accent>\`)
+- Generic hero copy ("Welcome to [X]", "Unlock the power of...", "Your all-in-one solution for...")
+- Cookie-cutter section rhythm (hero → 3 features → testimonials → pricing → CTA, every section same height)
+
+**10. Performance as Design** (6 items)
+- LCP < 2.0s (web apps), < 1.5s (informational sites)
+- CLS < 0.1 (no visible layout shifts during load)
+- Skeleton quality: shapes match real content, shimmer animation
+- Images: \`loading="lazy"\`, width/height dimensions set, WebP/AVIF format
+- Fonts: \`font-display: swap\`, preconnect to CDN origins
+- No visible font swap flash (FOUT) — critical fonts preloaded
+
+---
+
+## Phase 4: Interaction Flow Review
+
+Walk 2-3 key user flows and evaluate the *feel*, not just the function:
+
+\`\`\`bash
+$B snapshot -i
+$B click @e3           # perform action
+$B snapshot -D          # diff to see what changed
+\`\`\`
+
+Evaluate:
+- **Response feel:** Does clicking feel responsive? Any delays or missing loading states?
+- **Transition quality:** Are transitions intentional or generic/absent?
+- **Feedback clarity:** Did the action clearly succeed or fail? Is the feedback immediate?
+- **Form polish:** Focus states visible? Validation timing correct? Errors near the source?
+
+---
+
+## Phase 5: Cross-Page Consistency
+
+Compare screenshots and observations across pages for:
+- Navigation bar consistent across all pages?
+- Footer consistent?
+- Component reuse vs one-off designs (same button styled differently on different pages?)
+- Tone consistency (one page playful while another is corporate?)
+- Spacing rhythm carries across pages?
+
+---
+
+## Phase 6: Compile Report
+
+### Output Locations
+
+**Local:** \`.gstack/design-reports/design-audit-{domain}-{YYYY-MM-DD}.md\`
+
+**Project-scoped:**
+\`\`\`bash
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\\([^/]*/[^/]*\\)\\.git$|\\1|;s|.*[:/]\\([^/]*/[^/]*\\)$|\\1|' | tr '/' '-')
+mkdir -p ~/.gstack/projects/$SLUG
+\`\`\`
+Write to: \`~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md\`
+
+**Baseline:** Write \`design-baseline.json\` for regression mode:
+\`\`\`json
+{
+  "date": "YYYY-MM-DD",
+  "url": "<target>",
+  "designScore": "B",
+  "aiSlopScore": "C",
+  "categoryGrades": { "hierarchy": "A", "typography": "B", ... },
+  "findings": [{ "id": "FINDING-001", "title": "...", "impact": "high", "category": "typography" }]
+}
+\`\`\`
+
+### Scoring System
+
+**Dual headline scores:**
+- **Design Score: {A-F}** — weighted average of all 10 categories
+- **AI Slop Score: {A-F}** — standalone grade with pithy verdict
+
+**Per-category grades:**
+- **A:** Intentional, polished, delightful. Shows design thinking.
+- **B:** Solid fundamentals, minor inconsistencies. Looks professional.
+- **C:** Functional but generic. No major problems, no design point of view.
+- **D:** Noticeable problems. Feels unfinished or careless.
+- **F:** Actively hurting user experience. Needs significant rework.
+
+**Grade computation:** Each category starts at A. Each High-impact finding drops one letter grade. Each Medium-impact finding drops half a letter grade. Polish findings are noted but do not affect grade. Minimum is F.
+
+**Category weights for Design Score:**
+| Category | Weight |
+|----------|--------|
+| Visual Hierarchy | 15% |
+| Typography | 15% |
+| Spacing & Layout | 15% |
+| Color & Contrast | 10% |
+| Interaction States | 10% |
+| Responsive | 10% |
+| Content Quality | 10% |
+| AI Slop | 5% |
+| Motion | 5% |
+| Performance Feel | 5% |
+
+AI Slop is 5% of Design Score but also graded independently as a headline metric.
+
+### Regression Output
+
+When previous \`design-baseline.json\` exists or \`--regression\` flag is used:
+- Load baseline grades
+- Compare: per-category deltas, new findings, resolved findings
+- Append regression table to report
+
+---
+
+## Design Critique Format
+
+Use structured feedback, not opinions:
+- "I notice..." — observation (e.g., "I notice the primary CTA competes with the secondary action")
+- "I wonder..." — question (e.g., "I wonder if users will understand what 'Process' means here")
+- "What if..." — suggestion (e.g., "What if we moved search to a more prominent position?")
+- "I think... because..." — reasoned opinion (e.g., "I think the spacing between sections is too uniform because it doesn't create hierarchy")
+
+Tie everything to user goals and product objectives. Always suggest specific improvements alongside problems.
+
+---
+
+## Important Rules
+
+1. **Think like a designer, not a QA engineer.** You care whether things feel right, look intentional, and respect the user. You do NOT just care whether things "work."
+2. **Screenshots are evidence.** Every finding needs at least one screenshot. Use annotated screenshots (\`snapshot -a\`) to highlight elements.
+3. **Be specific and actionable.** "Change X to Y because Z" — not "the spacing feels off."
+4. **Never read source code.** Evaluate the rendered site, not the implementation. (Exception: offer to write DESIGN.md from extracted observations.)
+5. **AI Slop detection is your superpower.** Most developers can't evaluate whether their site looks AI-generated. You can. Be direct about it.
+6. **Quick wins matter.** Always include a "Quick Wins" section — the 3-5 highest-impact fixes that take <30 minutes each.
+7. **Use \`snapshot -C\` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
+9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
+10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.`;
+}
+
 const RESOLVERS: Record<string, () => string> = {
   COMMAND_REFERENCE: generateCommandReference,
   SNAPSHOT_FLAGS: generateSnapshotFlags,
@@ -486,6 +819,7 @@ const RESOLVERS: Record<string, () => string> = {
   BROWSE_SETUP: generateBrowseSetup,
   BASE_BRANCH_DETECT: generateBaseBranchDetect,
   QA_METHODOLOGY: generateQAMethodology,
+  DESIGN_METHODOLOGY: generateDesignMethodology,
 };
 
 // ─── Template Processing ────────────────────────────────────
@@ -539,6 +873,9 @@ function findTemplates(): string[] {
     path.join(ROOT, 'plan-eng-review', 'SKILL.md.tmpl'),
     path.join(ROOT, 'retro', 'SKILL.md.tmpl'),
     path.join(ROOT, 'gstack-upgrade', 'SKILL.md.tmpl'),
+    path.join(ROOT, 'plan-design-review', 'SKILL.md.tmpl'),
+    path.join(ROOT, 'qa-design-review', 'SKILL.md.tmpl'),
+    path.join(ROOT, 'design-consultation', 'SKILL.md.tmpl'),
     path.join(ROOT, 'document-release', 'SKILL.md.tmpl'),
   ];
   for (const p of candidates) {
diff --git a/scripts/skill-check.ts b/scripts/skill-check.ts
index 51a583a2..97c417ef 100644
--- a/scripts/skill-check.ts
+++ b/scripts/skill-check.ts
@@ -27,6 +27,9 @@ const SKILL_FILES = [
   'plan-ceo-review/SKILL.md',
   'plan-eng-review/SKILL.md',
   'setup-browser-cookies/SKILL.md',
+  'plan-design-review/SKILL.md',
+  'qa-design-review/SKILL.md',
+  'design-consultation/SKILL.md',
   'gstack-upgrade/SKILL.md',
   'document-release/SKILL.md',
 ].filter(f => fs.existsSync(path.join(ROOT, f)));
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index 7ec8b280..def042c9 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -69,6 +69,9 @@ describe('gen-skill-docs', () => {
     { dir: 'retro', name: 'retro' },
     { dir: 'setup-browser-cookies', name: 'setup-browser-cookies' },
     { dir: 'gstack-upgrade', name: 'gstack-upgrade' },
+    { dir: 'plan-design-review', name: 'plan-design-review' },
+    { dir: 'qa-design-review', name: 'qa-design-review' },
+    { dir: 'design-consultation', name: 'design-consultation' },
   ];
 
   test('every skill has a SKILL.md.tmpl template', () => {
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 37b42de8..4378c322 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1663,6 +1663,558 @@ describeE2E('Deferred skill E2E', () => {
   test.todo('/gstack-upgrade completes upgrade flow');
 });
 
+// --- Design Consultation E2E ---
+
+/**
+ * Asks the LLM judge whether `designMd` (raw DESIGN.md text) meets all seven criteria in the prompt below; resolves to `callJudge`'s `{ passed, reasoning }` verdict.
+ */
+async function designQualityJudge(designMd: string): Promise<{ passed: boolean; reasoning: string }> {
+  const judgePrompt = `You are evaluating a generated DESIGN.md file for quality.
+
+Evaluate against these criteria — ALL must pass for an overall "passed: true":
+1. Does NOT recommend Inter, Roboto, Arial, Helvetica, Open Sans, Lato, Montserrat, or Poppins as primary fonts
+2. Aesthetic direction is coherent with color approach (e.g., brutalist aesthetic doesn't pair with expressive color without explanation)
+3. Font recommendations include specific font names (not generic like "a sans-serif font")
+4. Color palette includes actual hex values, not placeholders like "[hex]"
+5. Rationale is provided for major decisions (not just "because it looks good")
+6. No AI slop patterns: purple gradients mentioned positively, "3-column feature grid" language, generic marketing speak
+7. Product context is reflected in design choices (civic tech → should have appropriate, professional aesthetic)
+
+DESIGN.md content:
+\`\`\`
+${designMd}
+\`\`\`
+
+Return JSON: { "passed": true/false, "reasoning": "one paragraph explaining your evaluation" }`;
+  return callJudge<{ passed: boolean; reasoning: string }>(judgePrompt);
+}
+
+describeE2E('Design Consultation E2E', () => { // E2E runs of the design-consultation skill in a throwaway git repo; the tests share designDir, so each cleans up files left by the previous one
+  let designDir: string;
+
+  beforeAll(() => {
+    designDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-design-consultation-'));
+    const { spawnSync } = require('child_process');
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: designDir, stdio: 'pipe', timeout: 5000 });
+
+    run('git', ['init']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+
+    // Seed a realistic project (README + package.json) so the skill has product context to read
+    fs.writeFileSync(path.join(designDir, 'README.md'), `# CivicPulse
+
+A civic tech data platform for government employees to access, visualize, and share public data. Built with Next.js and PostgreSQL.
+
+## Features
+- Real-time data dashboards for municipal budgets
+- Public records search with faceted filtering
+- Data export and sharing tools for inter-department collaboration
+`);
+    fs.writeFileSync(path.join(designDir, 'package.json'), JSON.stringify({
+      name: 'civicpulse',
+      version: '0.1.0',
+      dependencies: { next: '^14.0.0', react: '^18.2.0', 'tailwindcss': '^3.4.0' },
+    }, null, 2));
+
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'initial project setup']);
+
+    // Copy the generated design-consultation SKILL.md into the fixture (after the commit, so it is not part of it)
+    fs.mkdirSync(path.join(designDir, 'design-consultation'), { recursive: true });
+    fs.copyFileSync(
+      path.join(ROOT, 'design-consultation', 'SKILL.md'),
+      path.join(designDir, 'design-consultation', 'SKILL.md'),
+    );
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(designDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('Test 1: core flow produces valid DESIGN.md + CLAUDE.md', async () => {
+    const result = await runSkillTest({
+      prompt: `Read design-consultation/SKILL.md for the design consultation workflow.
+
+This is a civic tech data platform called CivicPulse for government employees who need to access public data. Read the README.md for details.
+
+Skip research — work from your design knowledge. Skip the font preview page. Skip any AskUserQuestion calls — this is non-interactive. Accept your first design system proposal.
+
+Write DESIGN.md and CLAUDE.md (or update it) in the working directory.`,
+      workingDirectory: designDir,
+      maxTurns: 20,
+      timeout: 360_000,
+      testName: 'design-consultation-core',
+      runId,
+    });
+
+    logCost('/design-consultation core', result);
+
+    const designPath = path.join(designDir, 'DESIGN.md');
+    const claudePath = path.join(designDir, 'CLAUDE.md');
+    const designExists = fs.existsSync(designPath);
+    const claudeExists = fs.existsSync(claudePath);
+    let designContent = '';
+
+    if (designExists) {
+      designContent = fs.readFileSync(designPath, 'utf-8');
+    }
+
+    // Structural checks: every required section name must appear (case-insensitive substring match)
+    const requiredSections = ['Product Context', 'Aesthetic', 'Typography', 'Color', 'Spacing', 'Layout', 'Motion'];
+    const missingSections = requiredSections.filter(s => !designContent.toLowerCase().includes(s.toLowerCase()));
+
+    // LLM judge for quality — only run on a DESIGN.md longer than 100 chars; a judge error counts as a pass
+    let judgeResult = { passed: false, reasoning: 'judge not run' };
+    if (designExists && designContent.length > 100) {
+      try {
+        judgeResult = await designQualityJudge(designContent);
+        console.log('Design quality judge:', JSON.stringify(judgeResult, null, 2));
+      } catch (err) {
+        console.warn('Judge failed:', err);
+        judgeResult = { passed: true, reasoning: 'judge error — defaulting to pass' };
+      }
+    }
+
+    const structuralPass = designExists && claudeExists && missingSections.length === 0; // NOTE: claudeExists feeds the recorded `passed` but is not asserted below
+    recordE2E('/design-consultation core', 'Design Consultation E2E', result, {
+      passed: structuralPass && judgeResult.passed && ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    expect(designExists).toBe(true);
+    if (designExists) {
+      expect(missingSections).toHaveLength(0);
+    }
+    if (claudeExists) {
+      const claude = fs.readFileSync(claudePath, 'utf-8');
+      expect(claude.toLowerCase()).toContain('design.md');
+    }
+  }, 420_000);
+
+  test('Test 2: research integration uses WebSearch', async () => {
+    // Clean up from previous test (DESIGN.md / CLAUDE.md written into the shared designDir)
+    try { fs.unlinkSync(path.join(designDir, 'DESIGN.md')); } catch {}
+    try { fs.unlinkSync(path.join(designDir, 'CLAUDE.md')); } catch {}
+
+    const result = await runSkillTest({
+      prompt: `Read design-consultation/SKILL.md for the design consultation workflow.
+
+This is a civic tech data platform called CivicPulse. Read the README.md.
+
+DO research competitors before proposing — search for civic tech and government data platform designs. Skip the font preview page. Skip any AskUserQuestion calls — this is non-interactive.
+
+Write DESIGN.md to the working directory.`,
+      workingDirectory: designDir,
+      maxTurns: 30,
+      timeout: 360_000,
+      testName: 'design-consultation-research',
+      runId,
+    });
+
+    logCost('/design-consultation research', result);
+
+    const designPath = path.join(designDir, 'DESIGN.md');
+    const designExists = fs.existsSync(designPath);
+    let designContent = '';
+    if (designExists) {
+      designContent = fs.readFileSync(designPath, 'utf-8');
+    }
+
+    // Check if WebSearch was used (may not be available in all envs) — logged only, never asserted
+    const webSearchCalls = result.toolCalls.filter(tc => tc.tool === 'WebSearch');
+    if (webSearchCalls.length > 0) {
+      console.log(`WebSearch used ${webSearchCalls.length} times`);
+    } else {
+      console.warn('WebSearch not used — may be unavailable in test env');
+    }
+
+    // LLM judge — informational in this test: the verdict is logged but is not part of `passed` or any expect
+    let judgeResult = { passed: false, reasoning: 'judge not run' };
+    if (designExists && designContent.length > 100) {
+      try {
+        judgeResult = await designQualityJudge(designContent);
+        console.log('Design quality judge (research):', JSON.stringify(judgeResult, null, 2));
+      } catch (err) {
+        console.warn('Judge failed:', err);
+        judgeResult = { passed: true, reasoning: 'judge error — defaulting to pass' };
+      }
+    }
+
+    recordE2E('/design-consultation research', 'Design Consultation E2E', result, {
+      passed: designExists && ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    expect(designExists).toBe(true);
+  }, 420_000);
+
+  test('Test 3: handles existing DESIGN.md', async () => {
+    // Pre-create a minimal DESIGN.md (overwrites whatever the previous test left behind)
+    fs.writeFileSync(path.join(designDir, 'DESIGN.md'), `# Design System — CivicPulse
+
+## Typography
+Body: system-ui
+`);
+
+    const result = await runSkillTest({
+      prompt: `Read design-consultation/SKILL.md for the design consultation workflow.
+
+There is already a DESIGN.md in this repo. Update it with a complete design system for CivicPulse, a civic tech data platform for government employees.
+
+Skip research. Skip font preview. Skip any AskUserQuestion calls — this is non-interactive.`,
+      workingDirectory: designDir,
+      maxTurns: 20,
+      timeout: 360_000,
+      testName: 'design-consultation-existing',
+      runId,
+    });
+
+    logCost('/design-consultation existing', result);
+
+    const designPath = path.join(designDir, 'DESIGN.md');
+    const designExists = fs.existsSync(designPath);
+    let designContent = '';
+    if (designExists) {
+      designContent = fs.readFileSync(designPath, 'utf-8');
+    }
+
+    // Should have more content than the minimal version, which only had a Typography section
+    const hasColor = designContent.toLowerCase().includes('color');
+    const hasSpacing = designContent.toLowerCase().includes('spacing');
+
+    recordE2E('/design-consultation existing', 'Design Consultation E2E', result, {
+      passed: designExists && hasColor && hasSpacing && ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    expect(designExists).toBe(true);
+    if (designExists) {
+      expect(hasColor).toBe(true);
+      expect(hasSpacing).toBe(true);
+    }
+  }, 420_000);
+
+  test('Test 4: generates font + color preview HTML', async () => {
+    // Clean up DESIGN.md from the previous test (only DESIGN.md is removed here)
+    try { fs.unlinkSync(path.join(designDir, 'DESIGN.md')); } catch {}
+
+    const result = await runSkillTest({
+      prompt: `Read design-consultation/SKILL.md for the design consultation workflow.
+
+This is CivicPulse, a civic tech data platform. Read the README.md.
+
+Skip research. Skip any AskUserQuestion calls — this is non-interactive. Generate the font and color preview page but write it to ./design-preview.html instead of /tmp/ (do NOT run the open command). Then write DESIGN.md.`,
+      workingDirectory: designDir,
+      maxTurns: 20,
+      timeout: 360_000,
+      testName: 'design-consultation-preview',
+      runId,
+    });
+
+    logCost('/design-consultation preview', result);
+
+    const previewPath = path.join(designDir, 'design-preview.html');
+    const designPath = path.join(designDir, 'DESIGN.md');
+    const previewExists = fs.existsSync(previewPath);
+    const designExists = fs.existsSync(designPath);
+
+    let previewContent = '';
+    if (previewExists) {
+      previewContent = fs.readFileSync(previewPath, 'utf-8');
+    }
+
+    const hasHtml = previewContent.includes('<html') || previewContent.includes('<!DOCTYPE');
+    const hasFontRef = previewContent.includes('font-family') || previewContent.includes('fonts.googleapis') || previewContent.includes('fonts.bunny');
+    const hasColorRef = previewContent.includes('#') && (previewContent.includes('background') || previewContent.includes('color:')); // NOTE: computed but never asserted or recorded below
+
+    // LLM judge on the DESIGN.md — informational in this test: logged, not part of `passed` or any expect
+    let judgeResult = { passed: false, reasoning: 'judge not run' };
+    if (designExists) {
+      const designContent = fs.readFileSync(designPath, 'utf-8');
+      if (designContent.length > 100) {
+        try {
+          judgeResult = await designQualityJudge(designContent);
+          console.log('Design quality judge (preview):', JSON.stringify(judgeResult, null, 2));
+        } catch (err) {
+          console.warn('Judge failed:', err);
+          judgeResult = { passed: true, reasoning: 'judge error — defaulting to pass' };
+        }
+      }
+    }
+
+    recordE2E('/design-consultation preview', 'Design Consultation E2E', result, {
+      passed: previewExists && designExists && hasHtml && ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    expect(previewExists).toBe(true);
+    if (previewExists) {
+      expect(hasHtml).toBe(true);
+      expect(hasFontRef).toBe(true);
+    }
+    expect(designExists).toBe(true);
+  }, 420_000);
+});
+
+// --- Plan Design Review E2E ---
+
+describeE2E('Plan Design Review E2E', () => {
+  let reviewDir: string;
+
+  beforeAll(() => {
+    // Reuse the shared fixture server when one is already set.
+    if (!testServer) testServer = startTestServer();
+    reviewDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-plan-design-'));
+    setupBrowseShims(reviewDir);
+
+    // Seed a one-commit git repo in the temp dir; git exit codes are not checked.
+    const { spawnSync } = require('child_process');
+    const git = (...args: string[]) =>
+      spawnSync('git', args, { cwd: reviewDir, stdio: 'pipe', timeout: 5000 });
+    git('init');
+    git('config', 'user.email', 'test@test.com');
+    git('config', 'user.name', 'Test');
+    fs.writeFileSync(path.join(reviewDir, 'index.html'), '<h1>Test</h1>\n');
+    git('add', '.');
+    git('commit', '-m', 'initial');
+
+    // Place the skill at plan-design-review/SKILL.md, the path the test prompts read.
+    const skillDir = path.join(reviewDir, 'plan-design-review');
+    fs.mkdirSync(skillDir, { recursive: true });
+    const skillSource = path.join(ROOT, 'plan-design-review', 'SKILL.md');
+    fs.copyFileSync(skillSource, path.join(skillDir, 'SKILL.md'));
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(reviewDir, { recursive: true, force: true }); } catch { /* best-effort cleanup */ }
+  });
+
+  test('Test 5: /plan-design-review produces audit report', async () => {
+    // Drive the skill non-interactively against the fixture site in --quick mode.
+    const result = await runSkillTest({
+      prompt: `IMPORTANT: The browse binary is already assigned below as B. Do NOT search for it or run the SKILL.md setup block — just use $B directly.
+
+B="${browseBin}"
+
+Read plan-design-review/SKILL.md for the design review workflow.
+
+Review the site at ${testServer.url}. Use --quick mode (homepage + 2 pages). Skip any AskUserQuestion calls — this is non-interactive. Write your audit report to ./design-audit.md. Do not offer to create DESIGN.md.`,
+      workingDirectory: reviewDir,
+      maxTurns: 20,
+      timeout: 360_000,
+      testName: 'plan-design-review-audit',
+      runId,
+    });
+
+    logCost('/plan-design-review audit', result);
+
+    // The prompt asks for the report at ./design-audit.md inside the working directory.
+    const reportPath = path.join(reviewDir, 'design-audit.md');
+    const reportExists = fs.existsSync(reportPath);
+    const reportContent = reportExists ? fs.readFileSync(reportPath, 'utf-8') : '';
+
+    // Hitting the turn limit is tolerated as long as the report was written.
+    const finishedOk = ['success', 'error_max_turns'].includes(result.exitReason);
+
+    recordE2E('/plan-design-review audit', 'Plan Design Review E2E', result, {
+      passed: reportExists && finishedOk,
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    expect(reportExists).toBe(true);
+    if (reportExists) {
+      // Guard against an empty or stub report.
+      expect(reportContent.length).toBeGreaterThan(200);
+    }
+  }, 420_000);
+
+  test('Test 6: /plan-design-review exports DESIGN.md', async () => {
+    // Remove artifacts a previous test may have left behind so the existence check
+    // below reflects this run only (Test 5 shares reviewDir).
+    for (const stale of ['design-audit.md', 'DESIGN.md']) {
+      try { fs.unlinkSync(path.join(reviewDir, stale)); } catch {}
+    }
+
+    const result = await runSkillTest({
+      prompt: `IMPORTANT: The browse binary is already assigned below as B. Do NOT search for it or run the SKILL.md setup block — just use $B directly.
+
+B="${browseBin}"
+
+Read plan-design-review/SKILL.md for the design review workflow.
+
+Review ${testServer.url} with --quick mode. Skip any AskUserQuestion calls — this is non-interactive. After Phase 2 (Design System Extraction), write a DESIGN.md to the working directory. Also write the audit report to ./design-audit.md.`,
+      workingDirectory: reviewDir,
+      maxTurns: 25,
+      timeout: 360_000,
+      testName: 'plan-design-review-export',
+      runId,
+    });
+
+    logCost('/plan-design-review export', result);
+
+    const designPath = path.join(reviewDir, 'DESIGN.md');
+    const designExists = fs.existsSync(designPath);
+    // Lower-cased once for the keyword checks; stays empty when the file was not produced.
+    const designText = designExists ? fs.readFileSync(designPath, 'utf-8').toLowerCase() : '';
+
+    // Minimal content check: the document should mention type or color somewhere.
+    const hasTypography = designText.includes('typography') || designText.includes('font');
+    const hasColor = designText.includes('color');
+
+    // The eval record requires DESIGN.md, while the assertions below treat it as best-effort.
+    recordE2E('/plan-design-review export', 'Plan Design Review E2E', result, {
+      passed: designExists && ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+    // DESIGN.md export is best-effort — agent may not always produce it
+    if (designExists) {
+      expect(hasTypography || hasColor).toBe(true);
+    }
+  }, 420_000);
+});
+
+// --- QA Design Review E2E ---
+
+describeE2E('QA Design Review E2E', () => {
+  let qaDesignDir: string;
+  let qaDesignServer: ReturnType<typeof Bun.serve> | null = null;
+
+  beforeAll(() => {
+    qaDesignDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-qa-design-'));
+    setupBrowseShims(qaDesignDir);
+
+    const { spawnSync } = require('child_process');
+    const git = (...args: string[]) =>
+      spawnSync('git', args, { cwd: qaDesignDir, stdio: 'pipe', timeout: 5000 });
+
+    git('init');
+    git('config', 'user.email', 'test@test.com');
+    git('config', 'user.name', 'Test');
+
+    // Fixture page: inline styles disagree on heading size, spacing, color, and buttons.
+    fs.writeFileSync(path.join(qaDesignDir, 'index.html'), `<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="utf-8">
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <title>Design Test App</title>
+  <link rel="stylesheet" href="style.css">
+</head>
+<body>
+  <header>
+    <h1 style="font-size: 48px; color: #333;">Welcome</h1>
+    <h2 style="font-size: 47px; color: #334;">Subtitle Here</h2>
+  </header>
+  <main>
+    <div class="card" style="padding: 10px; margin: 20px;">
+      <h3 style="color: blue;">Card Title</h3>
+      <p style="color: #666; font-size: 14px; line-height: 1.2;">Some content here with tight line height.</p>
+    </div>
+    <div class="card" style="padding: 30px; margin: 5px;">
+      <h3 style="color: green;">Another Card</h3>
+      <p style="color: #999; font-size: 16px;">Different spacing and colors for no reason.</p>
+    </div>
+    <button style="background: red; color: white; padding: 5px 10px; border: none;">Click Me</button>
+    <button style="background: #007bff; color: white; padding: 12px 24px; border: none; border-radius: 20px;">Also Click</button>
+  </main>
+</body>
+</html>`);
+
+    fs.writeFileSync(path.join(qaDesignDir, 'style.css'), `body {
+  font-family: Arial, sans-serif;
+  margin: 0;
+  padding: 20px;
+}
+.card {
+  border: 1px solid #ddd;
+  border-radius: 4px;
+}
+`);
+
+    git('add', '.');
+    git('commit', '-m', 'initial design test page');
+
+    // Serve the fixture directory over HTTP so the agent can browse it.
+    qaDesignServer = Bun.serve({
+      port: 0,
+      fetch(req) {
+        const { pathname } = new URL(req.url);
+        const relative = pathname === '/' ? 'index.html' : pathname.slice(1);
+        const filePath = path.join(qaDesignDir, relative);
+        const mimeByExt: Record<string, string> = { '.css': 'text/css', '.html': 'text/html' };
+        try {
+          const headers = { 'Content-Type': mimeByExt[path.extname(filePath)] ?? 'text/plain' };
+          return new Response(fs.readFileSync(filePath), { headers });
+        } catch {
+          return new Response('Not Found', { status: 404 });
+        }
+      },
+    });
+
+    // Install the skill at qa-design-review/SKILL.md, the path the test prompt reads.
+    const skillDir = path.join(qaDesignDir, 'qa-design-review');
+    fs.mkdirSync(skillDir, { recursive: true });
+    fs.copyFileSync(
+      path.join(ROOT, 'qa-design-review', 'SKILL.md'), path.join(skillDir, 'SKILL.md'),
+    );
+  });
+
+  afterAll(() => {
+    qaDesignServer?.stop();
+    try { fs.rmSync(qaDesignDir, { recursive: true, force: true }); } catch { /* best-effort cleanup */ }
+  });
+
+  test('Test 7: /qa-design-review audits and fixes design issues', async () => {
+    // Fail fast rather than sending the agent to "http://localhost:undefined".
+    if (!qaDesignServer) throw new Error('QA design fixture server was not started');
+    const serverUrl = `http://localhost:${qaDesignServer.port}`;
+
+    const result = await runSkillTest({
+      prompt: `IMPORTANT: The browse binary is already assigned below as B. Do NOT search for it or run the SKILL.md setup block — just use $B directly.
+
+B="${browseBin}"
+
+Read qa-design-review/SKILL.md for the design review + fix workflow.
+
+Review the site at ${serverUrl}. Use --quick mode. Skip any AskUserQuestion calls — this is non-interactive. Fix up to 3 issues max. Write your report to ./design-audit.md.`,
+      workingDirectory: qaDesignDir,
+      maxTurns: 30,
+      timeout: 360_000,
+      testName: 'qa-design-review-fix',
+      runId,
+    });
+
+    logCost('/qa-design-review fix', result);
+
+    const reportPath = path.join(qaDesignDir, 'design-audit.md');
+    const reportExists = fs.existsSync(reportPath);
+
+    // Count style(design) commits; stdout is null when git could not be spawned.
+    const gitLog = spawnSync('git', ['log', '--oneline'], { cwd: qaDesignDir, stdio: 'pipe' });
+    const commits = (gitLog.stdout ?? '').toString().trim().split('\n');
+    const designFixCommits = commits.filter((c: string) => c.includes('style(design)'));
+
+    recordE2E('/qa-design-review fix', 'QA Design Review E2E', result, {
+      passed: ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    // Accept error_max_turns — the fix loop is complex
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+
+    // Report and commits are best-effort — log what happened
+    if (reportExists) {
+      const report = fs.readFileSync(reportPath, 'utf-8');
+      console.log(`Design audit report: ${report.length} chars`);
+    } else {
+      console.warn('No design-audit.md generated');
+    }
+    console.log(`Design fix commits: ${designFixCommits.length}`);
+  }, 420_000);
+});
+
 // Module-level afterAll — finalize eval collector after all tests complete
 afterAll(async () => {
   if (evalCollector) {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index cbb74d13..83cdca6e 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -57,6 +57,34 @@ describe('SKILL.md command validation', () => {
     const result = validateSkill(qaOnlySkill);
     expect(result.snapshotFlagErrors).toHaveLength(0);
   });
+
+  test('all $B commands in plan-design-review/SKILL.md are valid browse commands', () => {
+    const skillPath = path.join(ROOT, 'plan-design-review', 'SKILL.md');
+    if (!fs.existsSync(skillPath)) return; // passes vacuously when the skill file is absent
+    const { invalid } = validateSkill(skillPath);
+    expect(invalid).toHaveLength(0);
+  });
+
+  test('all snapshot flags in plan-design-review/SKILL.md are valid', () => {
+    const skillPath = path.join(ROOT, 'plan-design-review', 'SKILL.md');
+    if (!fs.existsSync(skillPath)) return; // passes vacuously when the skill file is absent
+    const { snapshotFlagErrors } = validateSkill(skillPath);
+    expect(snapshotFlagErrors).toHaveLength(0);
+  });
+
+  test('all $B commands in qa-design-review/SKILL.md are valid browse commands', () => {
+    const skillPath = path.join(ROOT, 'qa-design-review', 'SKILL.md');
+    if (!fs.existsSync(skillPath)) return; // passes vacuously when the skill file is absent
+    const { invalid } = validateSkill(skillPath);
+    expect(invalid).toHaveLength(0);
+  });
+
+  test('all snapshot flags in qa-design-review/SKILL.md are valid', () => {
+    const skillPath = path.join(ROOT, 'qa-design-review', 'SKILL.md');
+    if (!fs.existsSync(skillPath)) return; // passes vacuously when the skill file is absent
+    const { snapshotFlagErrors } = validateSkill(skillPath);
+    expect(snapshotFlagErrors).toHaveLength(0);
+  });
 });
 
 describe('Command registry consistency', () => {
@@ -176,6 +204,9 @@ describe('Update check preamble', () => {
     'ship/SKILL.md', 'review/SKILL.md',
     'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
     'retro/SKILL.md',
+    'plan-design-review/SKILL.md',
+    'qa-design-review/SKILL.md',
+    'design-consultation/SKILL.md',
     'document-release/SKILL.md',
   ];
 
@@ -481,6 +512,9 @@ describe('v0.4.1 preamble features', () => {
     'ship/SKILL.md', 'review/SKILL.md',
     'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
     'retro/SKILL.md',
+    'plan-design-review/SKILL.md',
+    'qa-design-review/SKILL.md',
+    'design-consultation/SKILL.md',
     'document-release/SKILL.md',
   ];
 

From c8c2cbba33ac7037d9196d545be8effed8bba9db Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 08:10:01 -0500
Subject: [PATCH 09/22] docs: add /design-consultation skill to README (#127)

The skill was fully implemented but completely absent from the README.
Add it to the skill table, write a detailed section with usage example,
and include it in install/uninstall instructions.

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 README.md | 73 ++++++++++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 69 insertions(+), 4 deletions(-)

diff --git a/README.md b/README.md
index 1db8d1de..de6144ed 100644
--- a/README.md
+++ b/README.md
@@ -2,7 +2,7 @@
 
 **gstack turns Claude Code from one generic assistant into a team of specialists you can summon on demand.**
 
-Twelve opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, design review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
+Thirteen opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, design review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
 
 ### Without gstack
 
@@ -20,6 +20,7 @@ Twelve opinionated workflow skills for [Claude Code](https://docs.anthropic.com/
 | `/plan-ceo-review` | Founder / CEO | Rethink the problem. Find the 10-star product hiding inside the request. |
 | `/plan-eng-review` | Eng manager / tech lead | Lock in architecture, data flow, diagrams, edge cases, and tests. |
 | `/plan-design-review` | Senior product designer | Designer's eye audit. 80-item checklist, letter grades, AI Slop detection, DESIGN.md inference. Report only — never touches code. |
+| `/design-consultation` | Design consultant | Build a complete design system from scratch. Researches competitors, proposes aesthetic + typography + color + spacing + motion, generates a preview page, and writes DESIGN.md. |
 | `/review` | Paranoid staff engineer | Find the bugs that pass CI but blow up in production. Triages Greptile review comments. |
 | `/ship` | Release engineer | Sync main, run tests, resolve Greptile reviews, push, open PR. For a ready branch, not for deciding what to build. |
 | `/browse` | QA engineer | Give the agent eyes. It logs in, clicks through your app, takes screenshots, catches breakage. Full QA pass in 60 seconds. |
@@ -131,11 +132,11 @@ This is the setup I use. One person, ten parallel agents, each with the right co
 
 Open Claude Code and paste this. Claude will do the rest.
 
-> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
+> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
 
 ### Step 2: Add to your repo so teammates get it (optional)
 
-> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
+> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
 
 Real files get committed to your repo (not a submodule), so `git clone` just works. The binary and node\_modules are gitignored — teammates just need to run `cd .claude/skills/gstack && ./setup` once to build (or `/browse` handles it automatically on first use).
 
@@ -337,6 +338,70 @@ This is report only — it never touches your code. Use `/qa-design-review` when
 
 ---
 
+## `/design-consultation`
+
+This is my **design partner mode**.
+
+`/plan-design-review` audits a site that already exists. `/design-consultation` is for when you have nothing yet — no design system, no font choices, no color palette. You are starting from zero and you want a senior designer to sit down with you and build the whole visual identity together.
+
+It is a conversation, not a form. The agent asks about your product, your users, and your space. If you want, it researches what top competitors in your category are doing — fonts, colors, layout patterns, aesthetic direction. Then it proposes a complete, coherent design system: aesthetic direction, typography (3+ fonts with specific roles), color palette with hex values, spacing scale, layout approach, and motion strategy. Every recommendation comes with a rationale. Every choice reinforces every other choice.
+
+The key insight: individual design decisions are easy to make but hard to make coherently. Picking a font is simple. Picking a font that works with your color palette, your spacing density, your aesthetic direction, and your product's personality — that is the actual job. `/design-consultation` solves the coherence problem by proposing everything as one package, then letting you adjust any piece while it checks that the rest still holds together.
+
+After you agree on the system, it generates an interactive HTML preview page — your fonts rendered at real sizes, your color palette as actual UI components (buttons, cards, form inputs, alerts), light/dark mode toggle, all using your product name instead of lorem ipsum. You open the page in your browser and see the design system rendered before a single line of product code is written.
+
+Then it writes `DESIGN.md` to your repo root — your project's design source of truth — and updates `CLAUDE.md` so every future Claude Code session respects the system. From that point on, `/qa-design-review` can audit against it, and any agent working on your frontend knows the rules.
+
+```
+You:    /design-consultation
+
+Claude: From the README, this looks like a developer analytics dashboard
+        for engineering teams. Sound right? And would you like me to
+        research what other dev tools are doing for design, or should
+        I work from what I know?
+
+You:    Yes, it's a dashboard for eng managers. Research would be great.
+
+Claude: I looked at Linear, Vercel, Railway, PlanetScale, and PostHog.
+        They converge on clean sans-serifs and muted palettes, but
+        Linear stands out with its dark-first approach and tight spacing.
+        The gap: most of these feel interchangeable. Here's my proposal:
+
+        AESTHETIC: Industrial/Utilitarian — data-first, no decoration tax
+        TYPOGRAPHY: Geist (body + UI), Instrument Serif (display), JetBrains Mono (data)
+        COLOR: Restrained — slate neutrals, single teal accent (#0D9488)
+        SPACING: 4px base, compact density
+        LAYOUT: Grid-disciplined, 12-column
+        MOTION: Minimal-functional — only transitions that aid comprehension
+
+        This coheres because the utilitarian aesthetic demands a tight
+        spacing grid and restrained color. The serif display font creates
+        hierarchy contrast without adding visual noise. The monospace for
+        data tables feels native to the engineering audience.
+
+        Want to adjust anything, or should I generate the preview page?
+
+You:    Generate it.
+
+Claude: Preview opened in your browser.
+        [/tmp/design-consultation-preview-1710000000.html]
+
+        The page shows Instrument Serif at hero scale, Geist in body
+        paragraphs, JetBrains Mono in a sample data table. Color swatches
+        with your teal accent against slate grays. Buttons, cards, and
+        alerts rendered in both light and dark mode.
+
+        How does it feel? Want to adjust anything before I write DESIGN.md?
+
+You:    Looks great. Ship it.
+
+Claude: Wrote DESIGN.md (typography, color, spacing, layout, motion).
+        Updated CLAUDE.md with design system guidelines.
+        All future sessions will respect these choices.
+```
+
+---
+
 ## `/qa-design-review`
 
 This is my **designer who codes mode**.
@@ -757,7 +822,7 @@ Or set `auto_upgrade: true` in `~/.gstack/config.yaml` to upgrade automatically
 
 Paste this into Claude Code:
 
-> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review plan-design-review review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review plan-design-review review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
+> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review plan-design-review design-consultation review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review plan-design-review design-consultation review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
 
 ## Development
 

From 5f41cd9ad76aba2d3817498273d174a33e0aadd8 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 10:30:19 -0500
Subject: [PATCH 10/22] feat: show screenshots to user during QA and browse
 sessions (v0.5.0.1) (#129)

Add rule 11 to QA and Design methodologies in gen-skill-docs.ts
instructing Claude to Read screenshot PNGs after taking them.
This makes screenshots visible as clickable elements in Conductor
and other Claude Code UIs. Also added to browse and gstack SKILL
templates.

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                | 6 ++++++
 SKILL.md                    | 1 +
 SKILL.md.tmpl               | 1 +
 VERSION                     | 2 +-
 browse/SKILL.md             | 3 +++
 browse/SKILL.md.tmpl        | 3 +++
 plan-design-review/SKILL.md | 1 +
 qa-design-review/SKILL.md   | 1 +
 qa-only/SKILL.md            | 1 +
 qa/SKILL.md                 | 1 +
 scripts/gen-skill-docs.ts   | 6 ++++--
 11 files changed, 23 insertions(+), 3 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index a86569c8..92a45858 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,11 @@
 # Changelog
 
+## 0.5.0.1 — 2026-03-17
+
+### Fixed
+
+- **Screenshots are now visible during QA and browse sessions.** When gstack takes screenshots, they now show up as clickable image elements in your output — no more `/tmp/browse-screenshot.png` paths that you can't actually see. Works in `/qa`, `/qa-only`, `/plan-design-review`, `/qa-design-review`, `/browse`, and `/gstack`.
+
 ## 0.5.0 — 2026-03-16
 
 - **Your site just got a design review.** `/plan-design-review` opens your site and reviews it like a senior product designer — typography, spacing, hierarchy, color, responsive, interactions, and AI slop detection. Get letter grades (A-F) per category, a dual headline "Design Score" + "AI Slop Score", and a structured first impression that doesn't pull punches.
diff --git a/SKILL.md b/SKILL.md
index 76007eee..c0d6e267 100644
--- a/SKILL.md
+++ b/SKILL.md
@@ -111,6 +111,7 @@ If `NEEDS_SETUP`:
 - NEVER use `mcp__claude-in-chrome__*` tools. They are slow and unreliable.
 - Browser persists between calls — cookies, login sessions, and tabs carry over.
 - Dialogs (alert/confirm/prompt) are auto-accepted by default — no browser lockup.
+- **Show screenshots:** After `$B screenshot`, `$B snapshot -a -o`, or `$B responsive`, always use the Read tool on the output PNG(s) so the user can see them. Without this, screenshots are invisible.
 
 ## QA Workflows
 
diff --git a/SKILL.md.tmpl b/SKILL.md.tmpl
index 7f2e11db..dd2b2345 100644
--- a/SKILL.md.tmpl
+++ b/SKILL.md.tmpl
@@ -29,6 +29,7 @@ Auto-shuts down after 30 min idle. State persists between calls (cookies, tabs,
 - NEVER use `mcp__claude-in-chrome__*` tools. They are slow and unreliable.
 - Browser persists between calls — cookies, login sessions, and tabs carry over.
 - Dialogs (alert/confirm/prompt) are auto-accepted by default — no browser lockup.
+- **Show screenshots:** After `$B screenshot`, `$B snapshot -a -o`, or `$B responsive`, always use the Read tool on the output PNG(s) so the user can see them. Without this, screenshots are invisible.
 
 ## QA Workflows
 
diff --git a/VERSION b/VERSION
index 8f0916f7..494bbc1a 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.0
+0.5.0.1
diff --git a/browse/SKILL.md b/browse/SKILL.md
index dd473dc0..33accc09 100644
--- a/browse/SKILL.md
+++ b/browse/SKILL.md
@@ -184,6 +184,9 @@ $B snapshot -D                   # verify deletion happened
 $B diff https://staging.app.com https://prod.app.com
 ```
 
+### 11. Show screenshots to the user
+After `$B screenshot`, `$B snapshot -a -o`, or `$B responsive`, always use the Read tool on the output PNG(s) so the user can see them. Without this, screenshots are invisible.
+
 ## Snapshot Flags
 
 The snapshot is your primary tool for understanding and interacting with pages.
diff --git a/browse/SKILL.md.tmpl b/browse/SKILL.md.tmpl
index 6ce20634..0c42ffcb 100644
--- a/browse/SKILL.md.tmpl
+++ b/browse/SKILL.md.tmpl
@@ -102,6 +102,9 @@ $B snapshot -D                   # verify deletion happened
 $B diff https://staging.app.com https://prod.app.com
 ```
 
+### 11. Show screenshots to the user
+After `$B screenshot`, `$B snapshot -a -o`, or `$B responsive`, always use the Read tool on the output PNG(s) so the user can see them. Without this, screenshots are invisible.
+
 ## Snapshot Flags
 
 {{SNAPSHOT_FLAGS}}
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index c0ca9512..1231d968 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -465,6 +465,7 @@ Tie everything to user goals and product objectives. Always suggest specific imp
 8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
 9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
 10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.
+11. **Show screenshots to the user.** After every `$B screenshot`, `$B snapshot -a -o`, or `$B responsive` command, use the Read tool on the output file(s) so the user can see them inline. For `responsive` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.
 
 ---
 
diff --git a/qa-design-review/SKILL.md b/qa-design-review/SKILL.md
index 08c9916a..7fa0b856 100644
--- a/qa-design-review/SKILL.md
+++ b/qa-design-review/SKILL.md
@@ -477,6 +477,7 @@ Tie everything to user goals and product objectives. Always suggest specific imp
 8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
 9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
 10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.
+11. **Show screenshots to the user.** After every `$B screenshot`, `$B snapshot -a -o`, or `$B responsive` command, use the Read tool on the output file(s) so the user can see them inline. For `responsive` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.
 
 Record baseline design score and AI slop score at end of Phase 6.
 
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index 5e74f03e..ed732bf5 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -415,6 +415,7 @@ Minimum 0 per category.
 8. **Depth over breadth.** 5-10 well-documented issues with evidence > 20 vague descriptions.
 9. **Never delete output files.** Screenshots and reports accumulate — that's intentional.
 10. **Use `snapshot -C` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+11. **Show screenshots to the user.** After every `$B screenshot`, `$B snapshot -a -o`, or `$B responsive` command, use the Read tool on the output file(s) so the user can see them inline. For `responsive` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.
 
 ---
 
diff --git a/qa/SKILL.md b/qa/SKILL.md
index 6b078a9d..ac12fc94 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -454,6 +454,7 @@ Minimum 0 per category.
 8. **Depth over breadth.** 5-10 well-documented issues with evidence > 20 vague descriptions.
 9. **Never delete output files.** Screenshots and reports accumulate — that's intentional.
 10. **Use `snapshot -C` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+11. **Show screenshots to the user.** After every `$B screenshot`, `$B snapshot -a -o`, or `$B responsive` command, use the Read tool on the output file(s) so the user can see them inline. For `responsive` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.
 
 Record baseline health score at end of Phase 6.
 
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index 7a0b85ab..5d5f84bb 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -476,7 +476,8 @@ Minimum 0 per category.
 7. **Test like a user.** Use realistic data. Walk through complete workflows end-to-end.
 8. **Depth over breadth.** 5-10 well-documented issues with evidence > 20 vague descriptions.
 9. **Never delete output files.** Screenshots and reports accumulate — that's intentional.
-10. **Use \`snapshot -C\` for tricky UIs.** Finds clickable divs that the accessibility tree misses.`;
+10. **Use \`snapshot -C\` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
+11. **Show screenshots to the user.** After every \`$B screenshot\`, \`$B snapshot -a -o\`, or \`$B responsive\` command, use the Read tool on the output file(s) so the user can see them inline. For \`responsive\` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.`;
 }
 
 function generateDesignMethodology(): string {
@@ -809,7 +810,8 @@ Tie everything to user goals and product objectives. Always suggest specific imp
 7. **Use \`snapshot -C\` for tricky UIs.** Finds clickable divs that the accessibility tree misses.
 8. **Responsive is design, not just "not broken."** A stacked desktop layout on mobile is not responsive design — it's lazy. Evaluate whether the mobile layout makes *design* sense.
 9. **Document incrementally.** Write each finding to the report as you find it. Don't batch.
-10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.`;
+10. **Depth over breadth.** 5-10 well-documented findings with screenshots and specific suggestions > 20 vague observations.
+11. **Show screenshots to the user.** After every \`$B screenshot\`, \`$B snapshot -a -o\`, or \`$B responsive\` command, use the Read tool on the output file(s) so the user can see them inline. For \`responsive\` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.`;
 }
 
 const RESOLVERS: Record<string, () => string> = {

From 73b00b4e29eef5164e166a06db2df255edd4c379 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 10:33:46 -0500
Subject: [PATCH 11/22] feat: Review Readiness Dashboard + gstack-slug helper
 (v0.5.1) (#130)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: add bin/gstack-slug helper + migrate all inline SLUG computation

Extract the opaque SLUG sed pipeline into a shared 5-line shell script.
Replace 8 inline copies across templates with eval $(gstack-slug).
Sanitizes branch names (/ → -) to prevent subdirectory creation.

* feat: review readiness dashboard — track CEO/Eng/Design reviews per branch

Each review skill logs its result to JSONL. A shared {{REVIEW_DASHBOARD}}
placeholder displays run counts, timestamps, and a CLEARED TO SHIP verdict.
/ship pre-flight reads the dashboard and prompts when reviews are missing.

* chore: bump version and changelog (v0.5.1)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                      | 13 ++++++--
 TODOS.md                          | 26 ++++++++++++++++
 VERSION                           |  2 +-
 bin/gstack-slug                   |  9 ++++++
 design-consultation/SKILL.md      |  2 +-
 design-consultation/SKILL.md.tmpl |  2 +-
 plan-ceo-review/SKILL.md          | 47 +++++++++++++++++++++++++++++
 plan-ceo-review/SKILL.md.tmpl     | 19 ++++++++++++
 plan-design-review/SKILL.md       | 48 ++++++++++++++++++++++++++++-
 plan-design-review/SKILL.md.tmpl  | 18 +++++++++++
 plan-eng-review/SKILL.md          | 50 +++++++++++++++++++++++++++++--
 plan-eng-review/SKILL.md.tmpl     | 22 ++++++++++++--
 qa-design-review/SKILL.md         |  4 +--
 qa-design-review/SKILL.md.tmpl    |  2 +-
 qa-only/SKILL.md                  |  4 +--
 qa-only/SKILL.md.tmpl             |  4 +--
 qa/SKILL.md                       |  4 +--
 qa/SKILL.md.tmpl                  |  4 +--
 scripts/gen-skill-docs.ts         | 35 +++++++++++++++++++++-
 ship/SKILL.md                     | 37 +++++++++++++++++++++++
 ship/SKILL.md.tmpl                |  9 ++++++
 test/gen-skill-docs.test.ts       | 27 +++++++++++++++++
 test/skill-validation.test.ts     | 42 ++++++++++++++++++++++++++
 23 files changed, 407 insertions(+), 23 deletions(-)
 create mode 100755 bin/gstack-slug

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 92a45858..a4bd0786 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,11 +1,18 @@
 # Changelog
 
-## 0.5.0.1 — 2026-03-17
-
-### Fixed
+## 0.5.1 — 2026-03-17
 
+- **Know where you stand before you ship.** Every `/plan-ceo-review`, `/plan-eng-review`, and `/plan-design-review` now logs its result to a review tracker. At the end of each review, you see a **Review Readiness Dashboard** showing which reviews are done, when they ran, and whether they're clean — with a clear CLEARED TO SHIP or NOT READY verdict.
+- **`/ship` checks your reviews before creating the PR.** Pre-flight now reads the dashboard and asks if you want to continue when reviews are missing. Informational only — it won't block you, but you'll know what you skipped.
+- **One less thing to copy-paste.** The SLUG computation (that opaque sed pipeline for computing `owner-repo` from git remote) is now a shared `bin/gstack-slug` helper. All 8 inline copies across templates are replaced with `eval $(gstack-slug)`. If the format ever changes, fix it once.
 - **Screenshots are now visible during QA and browse sessions.** When gstack takes screenshots, they now show up as clickable image elements in your output — no more invisible `/tmp/browse-screenshot.png` paths you can't see. Works in `/qa`, `/qa-only`, `/plan-design-review`, `/qa-design-review`, `/browse`, and `/gstack`.
 
+### For contributors
+
+- Added `{{REVIEW_DASHBOARD}}` resolver to `gen-skill-docs.ts` — shared dashboard reader injected into 4 templates (3 review skills + ship).
+- Added `bin/gstack-slug` helper (5-line bash) with unit tests. Outputs `SLUG=` and `BRANCH=` lines, sanitizes `/` to `-`.
+- New TODOs: smart review relevance detection (P3), `/merge` skill for review-gated PR merge (P2).
+
 ## 0.5.0 — 2026-03-16
 
 - **Your site just got a design review.** `/plan-design-review` opens your site and reviews it like a senior product designer — typography, spacing, hierarchy, color, responsive, interactions, and AI slop detection. Get letter grades (A-F) per category, a dual headline "Design Score" + "AI Slop Score", and a structured first impression that doesn't pull punches.
diff --git a/TODOS.md b/TODOS.md
index d76f71c4..f52bb693 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -408,6 +408,32 @@ Shipped as `/design-consultation` on garrytan/design branch. Renamed from `/setu
 **Priority:** P2
 **Depends on:** None
 
+## Ship Confidence Dashboard
+
+### Smart review relevance detection
+
+**What:** Auto-detect which of the 4 reviews are relevant based on branch changes (skip Design Review if no CSS/view changes, skip Code Review if plan-only).
+
+**Why:** Currently the dashboard always shows every review row, whether or not that review is relevant to the change. On docs-only changes, "Design Review: NOT YET RUN" is noise.
+
+**Context:** /plan-design-review and /qa already do file-type detection in diff-aware mode. Could reuse that heuristic. Would require a `gstack-diff-scope` helper or enriching `gstack-slug` to also output change categories.
+
+**Effort:** M
+**Priority:** P3
+**Depends on:** Ship Confidence Dashboard (shipped)
+
+### /merge skill — review-gated PR merge
+
+**What:** Create a `/merge` skill that merges an approved PR, but first checks the Review Readiness Dashboard and runs `/review` (Fix-First) if code review hasn't been done. Separates "ship" (create PR) from "merge" (land it).
+
+**Why:** Currently `/review` runs inside `/ship` Step 3.5 but isn't tracked as a gate. A `/merge` skill ensures code review always happens before landing, and enables workflows where someone else reviews the PR first.
+
+**Context:** `/ship` creates the PR. `/merge` would: check dashboard → run `/review` if needed → `gh pr merge`. This is where code review tracking belongs — at merge time, not at plan time.
+
+**Effort:** M
+**Priority:** P2
+**Depends on:** Ship Confidence Dashboard (shipped)
+
 ## Completed
 
 ### Phase 1: Foundations (v0.2.0)
diff --git a/VERSION b/VERSION
index 494bbc1a..4b9fcbec 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.0.1
+0.5.1
diff --git a/bin/gstack-slug b/bin/gstack-slug
new file mode 100755
index 00000000..7336b7b4
--- /dev/null
+++ b/bin/gstack-slug
@@ -0,0 +1,9 @@
+#!/usr/bin/env bash
+# gstack-slug — output project slug and sanitized branch name
+# Usage: eval $(gstack-slug)  → sets SLUG and BRANCH variables
+# Or:    gstack-slug           → prints SLUG=... and BRANCH=... lines
+set -euo pipefail
+SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+BRANCH=$(git rev-parse --abbrev-ref HEAD 2>/dev/null | tr '/' '-')
+echo "SLUG=$SLUG"
+echo "BRANCH=$BRANCH"
diff --git a/design-consultation/SKILL.md b/design-consultation/SKILL.md
index d92d47fd..0d919950 100644
--- a/design-consultation/SKILL.md
+++ b/design-consultation/SKILL.md
@@ -114,7 +114,7 @@ ls src/ app/ pages/ components/ 2>/dev/null | head -30
 Look for brainstorm output:
 
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 ls ~/.gstack/projects/$SLUG/*brainstorm* 2>/dev/null | head -5
 ls .context/*brainstorm* .context/attachments/*brainstorm* 2>/dev/null | head -5
 ```
diff --git a/design-consultation/SKILL.md.tmpl b/design-consultation/SKILL.md.tmpl
index 11d868fa..ef5044fb 100644
--- a/design-consultation/SKILL.md.tmpl
+++ b/design-consultation/SKILL.md.tmpl
@@ -49,7 +49,7 @@ ls src/ app/ pages/ components/ 2>/dev/null | head -30
 Look for brainstorm output:
 
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 ls ~/.gstack/projects/$SLUG/*brainstorm* 2>/dev/null | head -5
 ls .context/*brainstorm* .context/attachments/*brainstorm* 2>/dev/null | head -5
 ```
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index b05db5e9..033f4e5f 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -534,6 +534,53 @@ List every ASCII diagram in files this plan touches. Still accurate?
 ### Unresolved Decisions
 If any AskUserQuestion goes unanswered, note it here. Never silently default.
 
+## Review Log
+
+After producing the Completion Summary above, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-ceo-review","timestamp":"TIMESTAMP","status":"STATUS","unresolved":N,"critical_gaps":N,"mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Before running this command, substitute the placeholder values from the Completion Summary you just produced:
+- **TIMESTAMP**: current ISO 8601 datetime (e.g., 2026-03-16T14:30:00)
+- **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
+- **unresolved**: number from "Unresolved decisions" in the summary
+- **critical_gaps**: number from "Failure modes: ___ CRITICAL GAPS" in the summary
+- **MODE**: the mode the user selected (SCOPE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
+
+## Review Readiness Dashboard
+
+After completing the review, read the review log to display the dashboard.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+```
+
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+
+```
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status               |
+|-----------------|------|---------------------|----------------------|
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
+| Design Review   |  0   | —                   | NOT YET RUN          |
++--------------------------------------------------------------------+
+| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
++====================================================================+
+```
+
+**Verdict logic:**
+- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
+- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
+- Informational only — does NOT block.
+
 ## Formatting Rules
 * NUMBER issues (1, 2, 3...) and LETTERS for options (A, B, C...).
 * Label with NUMBER + LETTER (e.g., "3A", "3B").
diff --git a/plan-ceo-review/SKILL.md.tmpl b/plan-ceo-review/SKILL.md.tmpl
index 9902fafb..8664d095 100644
--- a/plan-ceo-review/SKILL.md.tmpl
+++ b/plan-ceo-review/SKILL.md.tmpl
@@ -452,6 +452,25 @@ List every ASCII diagram in files this plan touches. Still accurate?
 ### Unresolved Decisions
 If any AskUserQuestion goes unanswered, note it here. Never silently default.
 
+## Review Log
+
+After producing the Completion Summary above, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-ceo-review","timestamp":"TIMESTAMP","status":"STATUS","unresolved":N,"critical_gaps":N,"mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Before running this command, substitute the placeholder values from the Completion Summary you just produced:
+- **TIMESTAMP**: current ISO 8601 datetime (e.g., 2026-03-16T14:30:00)
+- **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
+- **unresolved**: number from "Unresolved decisions" in the summary
+- **critical_gaps**: number from "Failure modes: ___ CRITICAL GAPS" in the summary
+- **MODE**: the mode the user selected (SCOPE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
+
+{{REVIEW_DASHBOARD}}
+
 ## Formatting Rules
 * NUMBER issues (1, 2, 3...) and LETTERS for options (A, B, C...).
 * Label with NUMBER + LETTER (e.g., "3A", "3B").
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index 1231d968..8fb0bfeb 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -384,7 +384,7 @@ Compare screenshots and observations across pages for:
 
 **Project-scoped:**
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to: `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
@@ -557,3 +557,49 @@ Project type: {web app / dashboard / marketing site / etc.}
 
 11. **Never fix anything.** Find and document only. Do not read source code, edit files, or suggest code fixes. Your job is to report what could be better and suggest design improvements. Use `/qa-design-review` for the fix loop.
 12. **The exception:** You MAY write a DESIGN.md file if the user accepts the offer. This is the only file you create.
+
+## Review Log
+
+After compiling the report, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-design-review","timestamp":"TIMESTAMP","status":"STATUS","design_score":"GRADE","ai_slop_score":"GRADE","mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute values from the report:
+- **TIMESTAMP**: current ISO 8601 datetime
+- **STATUS**: "clean" if Design Score is A or B; "issues_open" if C, D, or F
+- **GRADE**: the letter grade from the report (Design Score and AI Slop Score respectively)
+- **MODE**: Full / Quick / Deep / Diff-aware / Regression
+
+## Review Readiness Dashboard
+
+After completing the review, read the review log to display the dashboard.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+```
+
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+
+```
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status               |
+|-----------------|------|---------------------|----------------------|
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
+| Design Review   |  0   | —                   | NOT YET RUN          |
++--------------------------------------------------------------------+
+| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
++====================================================================+
+```
+
+**Verdict logic:**
+- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
+- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
+- Informational only — does NOT block.
diff --git a/plan-design-review/SKILL.md.tmpl b/plan-design-review/SKILL.md.tmpl
index b381c682..97546805 100644
--- a/plan-design-review/SKILL.md.tmpl
+++ b/plan-design-review/SKILL.md.tmpl
@@ -145,3 +145,21 @@ Project type: {web app / dashboard / marketing site / etc.}
 
 11. **Never fix anything.** Find and document only. Do not read source code, edit files, or suggest code fixes. Your job is to report what could be better and suggest design improvements. Use `/qa-design-review` for the fix loop.
 12. **The exception:** You MAY write a DESIGN.md file if the user accepts the offer. This is the only file you create.
+
+## Review Log
+
+After compiling the report, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-design-review","timestamp":"TIMESTAMP","status":"STATUS","design_score":"GRADE","ai_slop_score":"GRADE","mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute values from the report:
+- **TIMESTAMP**: current ISO 8601 datetime
+- **STATUS**: "clean" if Design Score is A or B; "issues_open" if C, D, or F
+- **GRADE**: the letter grade from the report (Design Score and AI Slop Score respectively)
+- **MODE**: Full / Quick / Deep / Diff-aware / Regression
+
+{{REVIEW_DASHBOARD}}
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index 4cd8f481..b5c0775b 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -154,8 +154,7 @@ For LLM/prompt changes: check the "Prompt/LLM changes" file patterns listed in C
 After producing the test diagram, write a test plan artifact to the project directory so `/qa` and `/qa-only` can consume it as primary test input (replacing the lossy git-diff heuristic):
 
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
-BRANCH=$(git rev-parse --abbrev-ref HEAD)
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 USER=$(whoami)
 DATETIME=$(date +%Y%m%d-%H%M%S)
 mkdir -p ~/.gstack/projects/$SLUG
@@ -259,5 +258,52 @@ Check the git log for this branch. If there are prior commits suggesting a previ
 * One sentence max per option. Pick in under 5 seconds.
 * After each review section, pause and ask for feedback before moving on.
 
+## Review Log
+
+After producing the Completion Summary above, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-eng-review","timestamp":"TIMESTAMP","status":"STATUS","unresolved":N,"critical_gaps":N,"mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute values from the Completion Summary:
+- **TIMESTAMP**: current ISO 8601 datetime
+- **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
+- **unresolved**: number from "Unresolved decisions" count
+- **critical_gaps**: number from "Failure modes: ___ critical gaps flagged"
+- **MODE**: SCOPE_REDUCTION / BIG_CHANGE / SMALL_CHANGE
+
+## Review Readiness Dashboard
+
+After completing the review, read the review log to display the dashboard.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+```
+
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+
+```
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status               |
+|-----------------|------|---------------------|----------------------|
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
+| Design Review   |  0   | —                   | NOT YET RUN          |
++--------------------------------------------------------------------+
+| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
++====================================================================+
+```
+
+**Verdict logic:**
+- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
+- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
+- Informational only — does NOT block.
+
 ## Unresolved decisions
 If the user does not respond to an AskUserQuestion or interrupts to move on, note which decisions were left unresolved. At the end of the review, list these as "Unresolved decisions that may bite you later" — never silently default to an option.
diff --git a/plan-eng-review/SKILL.md.tmpl b/plan-eng-review/SKILL.md.tmpl
index 410b0726..4905d8d3 100644
--- a/plan-eng-review/SKILL.md.tmpl
+++ b/plan-eng-review/SKILL.md.tmpl
@@ -89,8 +89,7 @@ For LLM/prompt changes: check the "Prompt/LLM changes" file patterns listed in C
 After producing the test diagram, write a test plan artifact to the project directory so `/qa` and `/qa-only` can consume it as primary test input (replacing the lossy git-diff heuristic):
 
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
-BRANCH=$(git rev-parse --abbrev-ref HEAD)
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 USER=$(whoami)
 DATETIME=$(date +%Y%m%d-%H%M%S)
 mkdir -p ~/.gstack/projects/$SLUG
@@ -194,5 +193,24 @@ Check the git log for this branch. If there are prior commits suggesting a previ
 * One sentence max per option. Pick in under 5 seconds.
 * After each review section, pause and ask for feedback before moving on.
 
+## Review Log
+
+After producing the Completion Summary above, persist the review result:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"plan-eng-review","timestamp":"TIMESTAMP","status":"STATUS","unresolved":N,"critical_gaps":N,"mode":"MODE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute values from the Completion Summary:
+- **TIMESTAMP**: current ISO 8601 datetime
+- **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
+- **unresolved**: number from "Unresolved decisions" count
+- **critical_gaps**: number from "Failure modes: ___ critical gaps flagged"
+- **MODE**: SCOPE_REDUCTION / BIG_CHANGE / SMALL_CHANGE
+
+{{REVIEW_DASHBOARD}}
+
 ## Unresolved decisions
 If the user does not respond to an AskUserQuestion or interrupts to move on, note which decisions were left unresolved. At the end of the review, list these as "Unresolved decisions that may bite you later" — never silently default to an option.
diff --git a/qa-design-review/SKILL.md b/qa-design-review/SKILL.md
index 7fa0b856..0d8d0771 100644
--- a/qa-design-review/SKILL.md
+++ b/qa-design-review/SKILL.md
@@ -396,7 +396,7 @@ Compare screenshots and observations across pages for:
 
 **Project-scoped:**
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to: `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
@@ -603,7 +603,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:**
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
diff --git a/qa-design-review/SKILL.md.tmpl b/qa-design-review/SKILL.md.tmpl
index 86e9aab9..0053a494 100644
--- a/qa-design-review/SKILL.md.tmpl
+++ b/qa-design-review/SKILL.md.tmpl
@@ -191,7 +191,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:**
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md`
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index ed732bf5..36f5fead 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -134,7 +134,7 @@ Before falling back to git diff heuristics, check for richer test plan sources:
 
 1. **Project-scoped test plans:** Check `~/.gstack/projects/` for recent `*-test-plan-*.md` files for this repo
    ```bash
-   SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
    ls -t ~/.gstack/projects/$SLUG/*-test-plan-*.md 2>/dev/null | head -1
    ```
 2. **Conversation context:** Check if a prior `/plan-eng-review` or `/plan-ceo-review` produced test plan output in this conversation
@@ -427,7 +427,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:** Write test outcome artifact for cross-session context:
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-test-outcome-{datetime}.md`
diff --git a/qa-only/SKILL.md.tmpl b/qa-only/SKILL.md.tmpl
index 5d49e201..101cd71c 100644
--- a/qa-only/SKILL.md.tmpl
+++ b/qa-only/SKILL.md.tmpl
@@ -52,7 +52,7 @@ Before falling back to git diff heuristics, check for richer test plan sources:
 
 1. **Project-scoped test plans:** Check `~/.gstack/projects/` for recent `*-test-plan-*.md` files for this repo
    ```bash
-   SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
    ls -t ~/.gstack/projects/$SLUG/*-test-plan-*.md 2>/dev/null | head -1
    ```
 2. **Conversation context:** Check if a prior `/plan-eng-review` or `/plan-ceo-review` produced test plan output in this conversation
@@ -72,7 +72,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:** Write test outcome artifact for cross-session context:
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-test-outcome-{datetime}.md`
diff --git a/qa/SKILL.md b/qa/SKILL.md
index ac12fc94..9bd8fc9b 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -171,7 +171,7 @@ Before falling back to git diff heuristics, check for richer test plan sources:
 
 1. **Project-scoped test plans:** Check `~/.gstack/projects/` for recent `*-test-plan-*.md` files for this repo
    ```bash
-   SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
    ls -t ~/.gstack/projects/$SLUG/*-test-plan-*.md 2>/dev/null | head -1
    ```
 2. **Conversation context:** Check if a prior `/plan-eng-review` or `/plan-ceo-review` produced test plan output in this conversation
@@ -579,7 +579,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:** Write test outcome artifact for cross-session context:
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-test-outcome-{datetime}.md`
diff --git a/qa/SKILL.md.tmpl b/qa/SKILL.md.tmpl
index f491999e..45dfbea6 100644
--- a/qa/SKILL.md.tmpl
+++ b/qa/SKILL.md.tmpl
@@ -72,7 +72,7 @@ Before falling back to git diff heuristics, check for richer test plan sources:
 
 1. **Project-scoped test plans:** Check `~/.gstack/projects/` for recent `*-test-plan-*.md` files for this repo
    ```bash
-   SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
    ls -t ~/.gstack/projects/$SLUG/*-test-plan-*.md 2>/dev/null | head -1
    ```
 2. **Conversation context:** Check if a prior `/plan-eng-review` or `/plan-ceo-review` produced test plan output in this conversation
@@ -207,7 +207,7 @@ Write the report to both local and project-scoped locations:
 
 **Project-scoped:** Write test outcome artifact for cross-session context:
 ```bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\([^/]*/[^/]*\)\.git$|\1|;s|.*[:/]\([^/]*/[^/]*\)$|\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 ```
 Write to `~/.gstack/projects/{slug}/{user}-{branch}-test-outcome-{datetime}.md`
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index 5d5f84bb..a9d3bce6 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -730,7 +730,7 @@ Compare screenshots and observations across pages for:
 
 **Project-scoped:**
 \`\`\`bash
-SLUG=$(git remote get-url origin 2>/dev/null | sed 's|.*[:/]\\([^/]*/[^/]*\\)\\.git$|\\1|;s|.*[:/]\\([^/]*/[^/]*\\)$|\\1|' | tr '/' '-')
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 mkdir -p ~/.gstack/projects/$SLUG
 \`\`\`
 Write to: \`~/.gstack/projects/{slug}/{user}-{branch}-design-audit-{datetime}.md\`
@@ -814,6 +814,38 @@ Tie everything to user goals and product objectives. Always suggest specific imp
 11. **Show screenshots to the user.** After every \`$B screenshot\`, \`$B snapshot -a -o\`, or \`$B responsive\` command, use the Read tool on the output file(s) so the user can see them inline. For \`responsive\` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.`;
 }
 
+function generateReviewDashboard(): string { // Resolver for the {{REVIEW_DASHBOARD}} placeholder: returns the static "Review Readiness Dashboard" markdown section (takes no input).
+  return `## Review Readiness Dashboard
+
+After completing the review, read the review log to display the dashboard.
+
+\`\`\`bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+\`\`\`
+
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+
+\`\`\`
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status               |
+|-----------------|------|---------------------|----------------------|
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
+| Design Review   |  0   | —                   | NOT YET RUN          |
++--------------------------------------------------------------------+
+| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
++====================================================================+
+\`\`\`
+
+**Verdict logic:**
+- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
+- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
+- Informational only — does NOT block.`;
+}
+
 const RESOLVERS: Record<string, () => string> = {
   COMMAND_REFERENCE: generateCommandReference,
   SNAPSHOT_FLAGS: generateSnapshotFlags,
@@ -822,6 +854,7 @@ const RESOLVERS: Record<string, () => string> = {
   BASE_BRANCH_DETECT: generateBaseBranchDetect,
   QA_METHODOLOGY: generateQAMethodology,
   DESIGN_METHODOLOGY: generateDesignMethodology,
+  REVIEW_DASHBOARD: generateReviewDashboard,
 };
 
 // ─── Template Processing ────────────────────────────────────
diff --git a/ship/SKILL.md b/ship/SKILL.md
index 8aa4a181..e7b8b753 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -132,6 +132,43 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 3. Run `git diff <base>...HEAD --stat` and `git log <base>..HEAD --oneline` to understand what's being shipped.
 
+4. Check review readiness:
+
+## Review Readiness Dashboard
+
+After completing the review, read the review log to display the dashboard.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+```
+
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+
+```
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status               |
+|-----------------|------|---------------------|----------------------|
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
+| Design Review   |  0   | —                   | NOT YET RUN          |
++--------------------------------------------------------------------+
+| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
++====================================================================+
+```
+
+**Verdict logic:**
+- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
+- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
+- Informational only — does NOT block.
+
+If the verdict is NOT "CLEARED TO SHIP (3/3)", use AskUserQuestion:
+- Show which reviews are missing or have open issues
+- RECOMMENDATION: Choose B (run missing reviews first) unless the change is trivial
+- Options: A) Ship anyway  B) Abort — run missing review(s) first  C) Reviews not relevant for this change
+
 ---
 
 ## Step 2: Merge the base branch (BEFORE tests)
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index 9339e90c..2a24bea3 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -50,6 +50,15 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 3. Run `git diff <base>...HEAD --stat` and `git log <base>..HEAD --oneline` to understand what's being shipped.
 
+4. Check review readiness:
+
+{{REVIEW_DASHBOARD}}
+
+If the verdict is NOT "CLEARED TO SHIP (3/3)", use AskUserQuestion:
+- Show which reviews are missing or have open issues
+- RECOMMENDATION: Choose B (run missing reviews first) unless the change is trivial
+- Options: A) Ship anyway  B) Abort — run missing review(s) first  C) Reviews not relevant for this change
+
 ---
 
 ## Step 2: Merge the base branch (BEFORE tests)
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index def042c9..26de63db 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -322,3 +322,30 @@ describe('description quality evals', () => {
     expect(tipsSection).not.toContain('->');
   });
 });
+
+describe('REVIEW_DASHBOARD resolver', () => { // Checks the generated SKILL.md files on disk rather than calling the resolver function directly.
+  const REVIEW_SKILLS = ['plan-ceo-review', 'plan-eng-review', 'plan-design-review']; // skill directories whose SKILL.md must embed the dashboard
+
+  for (const skill of REVIEW_SKILLS) {
+    test(`review dashboard appears in ${skill} generated file`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill, 'SKILL.md'), 'utf-8');
+      expect(content).toContain('reviews.jsonl');
+      expect(content).toContain('REVIEW READINESS DASHBOARD');
+    });
+  }
+
+  test('review dashboard appears in ship generated file', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('reviews.jsonl');
+    expect(content).toContain('REVIEW READINESS DASHBOARD');
+  });
+
+  test('resolver output contains key dashboard elements', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'plan-ceo-review', 'SKILL.md'), 'utf-8'); // plan-ceo-review serves as the sample generated file
+    expect(content).toContain('VERDICT');
+    expect(content).toContain('CLEARED TO SHIP');
+    expect(content).toContain('NOT YET RUN');
+    expect(content).toContain('7 days');
+    expect(content).toContain('Design Review');
+  });
+});
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 83cdca6e..78a9bef7 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -665,3 +665,45 @@ describe('Planted-bug fixture validation', () => {
     expect(content).toContain('update_column');
   });
 });
+
+// --- gstack-slug helper: bin/gstack-slug prints SLUG=... and BRANCH=... lines for use with eval ---
+
+describe('gstack-slug', () => {
+  const SLUG_BIN = path.join(ROOT, 'bin', 'gstack-slug');
+
+  test('binary exists and is executable', () => {
+    expect(fs.existsSync(SLUG_BIN)).toBe(true);
+    const stat = fs.statSync(SLUG_BIN);
+    expect(stat.mode & 0o111).toBeGreaterThan(0); // at least one execute bit (owner, group, or other) is set
+  });
+
+  test('outputs SLUG and BRANCH lines in a git repo', () => {
+    const result = Bun.spawnSync([SLUG_BIN], { cwd: ROOT, stdout: 'pipe', stderr: 'pipe' }); // run the helper with cwd = ROOT
+    expect(result.exitCode).toBe(0);
+    const output = result.stdout.toString();
+    expect(output).toContain('SLUG=');
+    expect(output).toContain('BRANCH=');
+  });
+
+  test('SLUG does not contain forward slashes', () => {
+    const result = Bun.spawnSync([SLUG_BIN], { cwd: ROOT, stdout: 'pipe', stderr: 'pipe' });
+    const slug = result.stdout.toString().match(/SLUG=(.*)/)?.[1] ?? ''; // text after SLUG= up to end of line; '' when the line is missing
+    expect(slug).not.toContain('/');
+    expect(slug.length).toBeGreaterThan(0);
+  });
+
+  test('BRANCH does not contain forward slashes', () => {
+    const result = Bun.spawnSync([SLUG_BIN], { cwd: ROOT, stdout: 'pipe', stderr: 'pipe' });
+    const branch = result.stdout.toString().match(/BRANCH=(.*)/)?.[1] ?? ''; // text after BRANCH= up to end of line; '' when the line is missing
+    expect(branch).not.toContain('/');
+    expect(branch.length).toBeGreaterThan(0);
+  });
+
+  test('output is eval-compatible (KEY=VALUE format)', () => {
+    const result = Bun.spawnSync([SLUG_BIN], { cwd: ROOT, stdout: 'pipe', stderr: 'pipe' });
+    const lines = result.stdout.toString().trim().split('\n');
+    expect(lines.length).toBe(2); // exactly two lines, SLUG first and BRANCH second
+    expect(lines[0]).toMatch(/^SLUG=.+/);
+    expect(lines[1]).toMatch(/^BRANCH=.+/);
+  });
+});

From c99757b522efaff4011f5210126afc26695b827c Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 10:49:22 -0500
Subject: [PATCH 12/22] =?UTF-8?q?feat:=20/design-consultation=20=E2=80=94?=
 =?UTF-8?q?=20risk-taking,=20visual=20research,=20ambitious=20preview=20(v?=
 =?UTF-8?q?0.5.2)=20(#131)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: /design-consultation — risk-taking thesis, visual research, ambitious preview

Add SAFE/RISK breakdown to design proposals so users see which choices
match category conventions vs. which are deliberate creative departures.

Wire browse binary for visual competitive research — agent browses
competitor sites, takes screenshots, and analyzes fonts/colors/spacing
with graceful degradation to WebSearch-only or built-in knowledge.

Upgrade preview page instructions to render realistic product mockups
(dashboards, marketing pages, settings forms) instead of just swatches.

Rewrite README section with the thesis: "coherence is table stakes —
the real question is where you take risks."

* chore: bump version and changelog (v0.5.2)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: restore SKILL.md files to match main

Prior commit included SKILL.md files regenerated from stale templates.
Restore to match origin/main content.

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                      |  7 ++-
 README.md                         | 67 +++++++++++++++--------
 VERSION                           |  2 +-
 design-consultation/SKILL.md      | 91 ++++++++++++++++++++++++++-----
 design-consultation/SKILL.md.tmpl | 74 ++++++++++++++++++++-----
 5 files changed, 185 insertions(+), 56 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index a4bd0786..38a4aef0 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,7 +1,12 @@
 # Changelog
 
-## 0.5.1 — 2026-03-17
+## 0.5.2 — 2026-03-17
+
+- **Your design consultant now takes creative risks.** `/design-consultation` doesn't just propose a safe, coherent system — it explicitly breaks down SAFE CHOICES (category baseline) vs. RISKS (where your product stands out). You pick which rules to break. Every risk comes with a rationale for why it works and what it costs.
+- **See the competition before you choose.** When you opt into research, the agent browses competitor sites with screenshots and accessibility tree analysis — not just web search results. You see what the landscape looks like before making design decisions.
+- **Preview pages that look like your product.** The preview page now renders realistic product mockups — dashboards with sidebar nav and data tables, marketing pages with hero sections, settings pages with forms — not just font swatches and color palettes.
 
+## 0.5.1 — 2026-03-17
 - **Know where you stand before you ship.** Every `/plan-ceo-review`, `/plan-eng-review`, and `/plan-design-review` now logs its result to a review tracker. At the end of each review, you see a **Review Readiness Dashboard** showing which reviews are done, when they ran, and whether they're clean — with a clear CLEARED TO SHIP or NOT READY verdict.
 - **`/ship` checks your reviews before creating the PR.** Pre-flight now reads the dashboard and asks if you want to continue when reviews are missing. Informational only — it won't block you, but you'll know what you skipped.
 - **One less thing to copy-paste.** The SLUG computation (that opaque sed pipeline for computing `owner-repo` from git remote) is now a shared `bin/gstack-slug` helper. All 14 inline copies across templates replaced with `eval $(gstack-slug)`. If the format ever changes, fix it once.
diff --git a/README.md b/README.md
index de6144ed..fd4b684f 100644
--- a/README.md
+++ b/README.md
@@ -20,7 +20,7 @@ Thirteen opinionated workflow skills for [Claude Code](https://docs.anthropic.co
 | `/plan-ceo-review` | Founder / CEO | Rethink the problem. Find the 10-star product hiding inside the request. |
 | `/plan-eng-review` | Eng manager / tech lead | Lock in architecture, data flow, diagrams, edge cases, and tests. |
 | `/plan-design-review` | Senior product designer | Designer's eye audit. 80-item checklist, letter grades, AI Slop detection, DESIGN.md inference. Report only — never touches code. |
-| `/design-consultation` | Design consultant | Build a complete design system from scratch. Researches competitors, proposes aesthetic + typography + color + spacing + motion, generates a preview page, and writes DESIGN.md. |
+| `/design-consultation` | Design consultant | Build a complete design system from scratch. Browses competitors to get in the ballpark, proposes safe choices AND creative risks, generates realistic product mockups, and writes DESIGN.md. |
 | `/review` | Paranoid staff engineer | Find the bugs that pass CI but blow up in production. Triages Greptile review comments. |
 | `/ship` | Release engineer | Sync main, run tests, resolve Greptile reviews, push, open PR. For a ready branch, not for deciding what to build. |
 | `/browse` | QA engineer | Give the agent eyes. It logs in, clicks through your app, takes screenshots, catches breakage. Full QA pass in 60 seconds. |
@@ -344,11 +344,15 @@ This is my **design partner mode**.
 
 `/plan-design-review` audits a site that already exists. `/design-consultation` is for when you have nothing yet — no design system, no font choices, no color palette. You are starting from zero and you want a senior designer to sit down with you and build the whole visual identity together.
 
-It is a conversation, not a form. The agent asks about your product, your users, and your space. If you want, it researches what top competitors in your category are doing — fonts, colors, layout patterns, aesthetic direction. Then it proposes a complete, coherent design system: aesthetic direction, typography (3+ fonts with specific roles), color palette with hex values, spacing scale, layout approach, and motion strategy. Every recommendation comes with a rationale. Every choice reinforces every other choice.
+It is a conversation, not a form. The agent asks about your product, your users, and your audience. It thinks about what your product needs to communicate — trust, speed, craft, warmth, whatever fits — and works backward from that to concrete choices. Then it proposes a complete, coherent design system: aesthetic direction, typography (3+ fonts with specific roles), color palette with hex values, spacing scale, layout approach, and motion strategy. Every recommendation comes with a rationale. Every choice reinforces every other choice.
 
-The key insight: individual design decisions are easy to make but hard to make coherently. Picking a font is simple. Picking a font that works with your color palette, your spacing density, your aesthetic direction, and your product's personality — that is the actual job. `/design-consultation` solves the coherence problem by proposing everything as one package, then letting you adjust any piece while it checks that the rest still holds together.
+But coherence is table stakes. Every dev tool dashboard looks the same — clean sans-serif, muted grays, a blue accent. They are all coherent. They are all forgettable. The difference between a product that looks "nice" and one that people actually recognize is the **deliberate creative risks**: the unexpected serif for headings, the bold accent nobody else in your category uses, the tighter spacing that makes your data feel authoritative instead of airy.
 
-After you agree on the system, it generates an interactive HTML preview page — your fonts rendered at real sizes, your color palette as actual UI components (buttons, cards, form inputs, alerts), light/dark mode toggle, all using your product name instead of lorem ipsum. You open the page in your browser and see the design system rendered before a single line of product code is written.
+That is what `/design-consultation` is really about. It does not just propose a safe system. It proposes safe choices AND risks — and tells you which is which. "Here are the choices that keep you literate in your category. And here is where I think you should break from convention, and why." You pick which risks to take. The agent checks that the whole system still coheres either way.
+
+If you want, the agent will browse your competitors' actual sites — take screenshots, analyze their fonts and colors and spacing — so you can see the landscape before you make choices. This is not about copying. It is about getting in the ballpark so you know what the conventions are, and then deciding which ones are worth breaking.
+
+After you agree on the system, it generates an interactive HTML preview page — not just swatches and font samples, but realistic product pages. If you are building a dashboard, you see a dashboard with a sidebar, data tables, and stat cards. If you are building a marketing site, you see a hero section with real copy and a CTA. Everything rendered in your design system, with your product name, in light and dark mode. You see what your product could feel like before a single line of production code is written.
 
 Then it writes `DESIGN.md` to your repo root — your project's design source of truth — and updates `CLAUDE.md` so every future Claude Code session respects the system. From that point on, `/qa-design-review` can audit against it, and any agent working on your frontend knows the rules.
 
@@ -356,44 +360,59 @@ Then it writes `DESIGN.md` to your repo root — your project's design source of
 You:   /design-consultation
 
 Claude: From the README, this looks like a developer analytics dashboard
-        for engineering teams. Sound right? And would you like me to
-        research what other dev tools are doing for design, or should
-        I work from what I know?
+        for engineering teams. Sound right? Tell me about the feeling
+        you want — and would you like me to browse some competitors
+        first so we can see the landscape?
+
+You:    Yes, it's for eng managers. Show me what's out there.
 
-You:    Yes, it's a dashboard for eng managers. Research would be great.
+Claude: [browses Linear, Vercel, Datadog, PostHog — takes screenshots]
 
-Claude: I looked at Linear, Vercel, Railway, Planetscale, and Posthog.
-        They converge on clean sans-serifs and muted palettes, but
-        Linear stands out with its dark-first approach and tight spacing.
-        The gap: most of these feel interchangeable. Here's my proposal:
+        Here's the landscape. They all converge on clean sans-serifs
+        and muted blue-gray palettes. Linear stands out with dark-first
+        and tight spacing. The rest feel interchangeable.
 
-        AESTHETIC: Industrial/Utilitarian — data-first, no decoration tax
+        Here's my proposal — and where I'd play it safe vs. take risks:
+
+        AESTHETIC: Industrial/Utilitarian — data-first, every pixel earns its place
         TYPOGRAPHY: Geist (body + UI), Instrument Serif (display), JetBrains Mono (data)
         COLOR: Restrained — slate neutrals, single teal accent (#0D9488)
         SPACING: 4px base, compact density
         LAYOUT: Grid-disciplined, 12-column
         MOTION: Minimal-functional — only transitions that aid comprehension
 
-        This coheres because the utilitarian aesthetic demands a tight
-        spacing grid and restrained color. The serif display font creates
-        hierarchy contrast without adding visual noise. The monospace for
-        data tables feels native to the engineering audience.
+        SAFE CHOICES (match category expectations):
+          Geist for body — your users already know this font from Vercel
+          Slate neutrals — cool grays feel right for data-heavy UIs
+          Grid-disciplined layout — dashboards need predictable alignment
+
+        RISKS (where you'd stand out):
+          Instrument Serif for display headings — nobody in dev tools
+            uses a serif. It creates instant hierarchy contrast and
+            signals "we care about craft" in a space full of sans-serifs.
+          Single teal accent instead of blue — every competitor uses blue.
+            Teal is close enough to feel trustworthy, different enough
+            to be recognizable.
+          4px compact density — tighter than Linear, says "we respect
+            your screen real estate."
 
-        Want to adjust anything, or should I generate the preview page?
+        The safe choices keep you literate. The risks are where your
+        product gets its own face. Which risks appeal to you?
 
-You:    Generate it.
+You:    Love the serif risk. Let's see it.
 
 Claude: Preview opened in your browser.
         [/tmp/design-consultation-preview-1710000000.html]
 
-        The page shows Instrument Serif at hero scale, Geist in body
-        paragraphs, JetBrains Mono in a sample data table. Color swatches
-        with your teal accent against slate grays. Buttons, cards, and
-        alerts rendered in both light and dark mode.
+        The page shows a realistic dashboard: sidebar nav, header with
+        avatar, stat cards, data table — all in your design system.
+        Instrument Serif at hero scale, Geist in body text, JetBrains
+        Mono in the data table. Teal accent on buttons and active states.
+        Light and dark mode toggle in the corner.
 
         How does it feel? Want to adjust anything before I write DESIGN.md?
 
-You:    Looks great. Ship it.
+You:    Ship it.
 
 Claude: Wrote DESIGN.md (typography, color, spacing, layout, motion).
         Updated CLAUDE.md with design system guidelines.
diff --git a/VERSION b/VERSION
index 4b9fcbec..cb0c939a 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.1
+0.5.2
diff --git a/design-consultation/SKILL.md b/design-consultation/SKILL.md
index 0d919950..f04e2213 100644
--- a/design-consultation/SKILL.md
+++ b/design-consultation/SKILL.md
@@ -123,6 +123,29 @@ If brainstorm output exists, read it — the product context is pre-filled.
 
 If the codebase is empty and purpose is unclear, say: *"I don't have a clear picture of what you're building yet. Want to brainstorm first with `/brainstorm`? Once we know the product direction, we can set up the design system."*
 
+**Find the browse binary (optional — enables visual competitive research):**
+
+## SETUP (run this check BEFORE any browse command)
+
+```bash
+_ROOT=$(git rev-parse --show-toplevel 2>/dev/null)
+B=""
+[ -n "$_ROOT" ] && [ -x "$_ROOT/.claude/skills/gstack/browse/dist/browse" ] && B="$_ROOT/.claude/skills/gstack/browse/dist/browse"
+[ -z "$B" ] && B=~/.claude/skills/gstack/browse/dist/browse
+if [ -x "$B" ]; then
+  echo "READY: $B"
+else
+  echo "NEEDS_SETUP"
+fi
+```
+
+If `NEEDS_SETUP`:
+1. Tell the user: "gstack browse needs a one-time build (~10 seconds). OK to proceed?" Then STOP and wait.
+2. Run: `cd <SKILL_DIR> && ./setup`
+3. If `bun` is not installed: `curl -fsSL https://bun.sh/install | bash`
+
+If browse is not available, that's fine — visual research is optional. The skill works without it using WebSearch and your built-in design knowledge.
+
 ---
 
 ## Phase 1: Product Context
@@ -143,17 +166,40 @@ If the README or brainstorm gives you enough context, pre-fill and confirm: *"Fr
 
 If the user wants competitive research:
 
+**Step 1: Identify competitors via WebSearch**
+
 Use WebSearch to find 5-10 products in their space. Search for:
 - "[product category] website design"
 - "[product category] best websites 2025"
 - "best [industry] web apps"
 
-For each competitor found, note: fonts used, color palette, layout approach, aesthetic direction.
+**Step 2: Visual research via browse (if available)**
+
+If the browse binary is available (`$B` is set), visit the top 3-5 competitor sites and capture visual evidence:
 
-Summarize your findings conversationally:
-> "I looked at [competitors]. They tend toward [patterns] — lots of [common choices]. The opportunity to be distinctive is [gap]. Here's what I'd recommend based on this..."
+```bash
+$B goto "https://competitor-site.com"
+$B screenshot "/tmp/design-research-competitor-name.png"
+$B snapshot
+```
 
-If WebSearch is unavailable or returns poor results, fall back gracefully: *"Couldn't get good research results, so I'll work from my design knowledge of the [industry] space."*
+For each competitor, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
+
+If a competitor site blocks the headless browser or requires login, skip it and note why.
+
+If browse is not available, rely on WebSearch results and your built-in design knowledge — this is fine.
+
+**Step 3: Synthesize findings**
+
+The goal of research is NOT to copy. It is to get in the ballpark — to understand the visual language users in this category already expect. This gives you the baseline. The interesting design work starts after you have the baseline: deciding where to follow conventions (so the product feels literate) and where to break from them (so the product is memorable).
+
+Summarize conversationally:
+> "I looked at [competitors]. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
+
+**Graceful degradation:**
+- Browse available → screenshots + snapshots + WebSearch (richest research)
+- Browse unavailable → WebSearch only (still good)
+- WebSearch also unavailable → agent's built-in design knowledge (always works)
 
 If the user said no research, skip entirely and proceed to Phase 3 using your built-in design knowledge.
 
@@ -163,7 +209,7 @@ If the user said no research, skip entirely and proceed to Phase 3 using your bu
 
 This is the soul of the skill. Propose EVERYTHING as one coherent package.
 
-**AskUserQuestion Q2 — present the full proposal:**
+**AskUserQuestion Q2 — present the full proposal with SAFE/RISK breakdown:**
 
 ```
 Based on [product context] and [research findings / my design knowledge]:
@@ -178,12 +224,21 @@ MOTION: [approach] — [rationale]
 
 This system is coherent because [explain how choices reinforce each other].
 
-Want to adjust anything? You can drill into any section, or just tell me
-what feels off and I'll rework it. Or if this looks right, I'll generate
-a preview page so you can see the fonts and colors rendered.
+SAFE CHOICES (category baseline — your users expect these):
+  - [2-3 decisions that match category conventions, with rationale for playing safe]
+
+RISKS (where your product gets its own face):
+  - [2-3 deliberate departures from convention]
+  - For each risk: what it is, why it works, what you gain, what it costs
+
+The safe choices keep you literate in your category. The risks are where
+your product becomes memorable. Which risks appeal to you? Want to see
+different ones? Or adjust anything else?
 ```
 
-**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) Start over with a different direction. D) Skip the preview, just write DESIGN.md.
+The SAFE/RISK breakdown is critical. Design coherence is table stakes — every product in a category can be coherent and still look identical. The real question is: where do you take creative risks? The agent should always propose at least 2 risks, each with a clear rationale for why the risk is worth taking and what the user gives up. Risks might include: an unexpected typeface for the category, a bold accent color nobody else uses, tighter or looser spacing than the norm, a layout approach that breaks from convention, motion choices that add personality.
+
+**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) I want different risks — show me wilder options. D) Start over with a different direction. E) Skip the preview, just write DESIGN.md.
 
 ### Your Design Knowledge (use to inform proposals — do NOT display as tables)
 
@@ -273,7 +328,7 @@ The agent writes a **single, self-contained HTML file** (no framework dependenci
 1. **Loads proposed fonts** from Google Fonts (or Bunny Fonts) via `<link>` tags
 2. **Uses the proposed color palette** throughout — dogfood the design system
 3. **Shows the product name** (not "Lorem Ipsum") as the hero heading
-4. **Font comparison section:**
+4. **Font specimen section:**
    - Each font candidate shown in its proposed role (hero heading, body paragraph, button label, data table row)
    - Side-by-side comparison if multiple candidates for one role
    - Real content that matches the product (e.g., civic tech → government data examples)
@@ -281,11 +336,17 @@ The agent writes a **single, self-contained HTML file** (no framework dependenci
    - Swatches with hex values and names
    - Sample UI components rendered in the palette: buttons (primary, secondary, ghost), cards, form inputs, alerts (success, warning, error, info)
    - Background/text color combinations showing contrast
-6. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
-7. **Clean, professional layout** — the preview page IS a taste signal for the skill
-8. **Responsive** — looks good on any screen width
-
-The page should make the user think "oh nice, they thought of this." It's selling the design system visually, not just listing hex codes.
+6. **Realistic product mockups** — this is what makes the preview page powerful. Based on the project type from Phase 1, render 2-3 realistic page layouts using the full design system:
+   - **Dashboard / web app:** sample data table with metrics, sidebar nav, header with user avatar, stat cards
+   - **Marketing site:** hero section with real copy, feature highlights, testimonial block, CTA
+   - **Settings / admin:** form with labeled inputs, toggle switches, dropdowns, save button
+   - **Auth / onboarding:** login form with social buttons, branding, input validation states
+   - Use the product name, realistic content for the domain, and the proposed spacing/layout/border-radius. The user should see their product (roughly) before writing any code.
+7. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
+8. **Clean, professional layout** — the preview page IS a taste signal for the skill
+9. **Responsive** — looks good on any screen width
+
+The page should make the user think "oh nice, they thought of this." It's selling the design system by showing what the product could feel like, not just listing hex codes and font names.
 
 If `open` fails (headless environment), tell the user: *"I wrote the preview to [path] — open it in your browser to see the fonts and colors rendered."*
 
diff --git a/design-consultation/SKILL.md.tmpl b/design-consultation/SKILL.md.tmpl
index ef5044fb..0ffb121c 100644
--- a/design-consultation/SKILL.md.tmpl
+++ b/design-consultation/SKILL.md.tmpl
@@ -58,6 +58,12 @@ If brainstorm output exists, read it — the product context is pre-filled.
 
 If the codebase is empty and purpose is unclear, say: *"I don't have a clear picture of what you're building yet. Want to brainstorm first with `/brainstorm`? Once we know the product direction, we can set up the design system."*
 
+**Find the browse binary (optional — enables visual competitive research):**
+
+{{BROWSE_SETUP}}
+
+If browse is not available, that's fine — visual research is optional. The skill works without it using WebSearch and your built-in design knowledge.
+
 ---
 
 ## Phase 1: Product Context
@@ -78,17 +84,40 @@ If the README or brainstorm gives you enough context, pre-fill and confirm: *"Fr
 
 If the user wants competitive research:
 
+**Step 1: Identify competitors via WebSearch**
+
 Use WebSearch to find 5-10 products in their space. Search for:
 - "[product category] website design"
 - "[product category] best websites 2025"
 - "best [industry] web apps"
 
-For each competitor found, note: fonts used, color palette, layout approach, aesthetic direction.
+**Step 2: Visual research via browse (if available)**
+
+If the browse binary is available (`$B` is set), visit the top 3-5 competitor sites and capture visual evidence:
+
+```bash
+$B goto "https://competitor-site.com"
+$B screenshot "/tmp/design-research-competitor-name.png"
+$B snapshot
+```
+
+For each competitor, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
 
-Summarize your findings conversationally:
-> "I looked at [competitors]. They tend toward [patterns] — lots of [common choices]. The opportunity to be distinctive is [gap]. Here's what I'd recommend based on this..."
+If a competitor site blocks the headless browser or requires login, skip it and note why.
 
-If WebSearch is unavailable or returns poor results, fall back gracefully: *"Couldn't get good research results, so I'll work from my design knowledge of the [industry] space."*
+If browse is not available, rely on WebSearch results and your built-in design knowledge — this is fine.
+
+**Step 3: Synthesize findings**
+
+The goal of research is NOT to copy. It is to get in the ballpark — to understand the visual language users in this category already expect. This gives you the baseline. The interesting design work starts after you have the baseline: deciding where to follow conventions (so the product feels literate) and where to break from them (so the product is memorable).
+
+Summarize conversationally:
+> "I looked at [competitors]. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
+
+**Graceful degradation:**
+- Browse available → screenshots + snapshots + WebSearch (richest research)
+- Browse unavailable → WebSearch only (still good)
+- WebSearch also unavailable → agent's built-in design knowledge (always works)
 
 If the user said no research, skip entirely and proceed to Phase 3 using your built-in design knowledge.
 
@@ -98,7 +127,7 @@ If the user said no research, skip entirely and proceed to Phase 3 using your bu
 
 This is the soul of the skill. Propose EVERYTHING as one coherent package.
 
-**AskUserQuestion Q2 — present the full proposal:**
+**AskUserQuestion Q2 — present the full proposal with SAFE/RISK breakdown:**
 
 ```
 Based on [product context] and [research findings / my design knowledge]:
@@ -113,12 +142,21 @@ MOTION: [approach] — [rationale]
 
 This system is coherent because [explain how choices reinforce each other].
 
-Want to adjust anything? You can drill into any section, or just tell me
-what feels off and I'll rework it. Or if this looks right, I'll generate
-a preview page so you can see the fonts and colors rendered.
+SAFE CHOICES (category baseline — your users expect these):
+  - [2-3 decisions that match category conventions, with rationale for playing safe]
+
+RISKS (where your product gets its own face):
+  - [2-3 deliberate departures from convention]
+  - For each risk: what it is, why it works, what you gain, what it costs
+
+The safe choices keep you literate in your category. The risks are where
+your product becomes memorable. Which risks appeal to you? Want to see
+different ones? Or adjust anything else?
 ```
 
-**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) Start over with a different direction. D) Skip the preview, just write DESIGN.md.
+The SAFE/RISK breakdown is critical. Design coherence is table stakes — every product in a category can be coherent and still look identical. The real question is: where do you take creative risks? The agent should always propose at least 2 risks, each with a clear rationale for why the risk is worth taking and what the user gives up. Risks might include: an unexpected typeface for the category, a bold accent color nobody else uses, tighter or looser spacing than the norm, a layout approach that breaks from convention, motion choices that add personality.
+
+**Options:** A) Looks great — generate the preview page. B) I want to adjust [section]. C) I want different risks — show me wilder options. D) Start over with a different direction. E) Skip the preview, just write DESIGN.md.
 
 ### Your Design Knowledge (use to inform proposals — do NOT display as tables)
 
@@ -208,7 +246,7 @@ The agent writes a **single, self-contained HTML file** (no framework dependenci
 1. **Loads proposed fonts** from Google Fonts (or Bunny Fonts) via `<link>` tags
 2. **Uses the proposed color palette** throughout — dogfood the design system
 3. **Shows the product name** (not "Lorem Ipsum") as the hero heading
-4. **Font comparison section:**
+4. **Font specimen section:**
    - Each font candidate shown in its proposed role (hero heading, body paragraph, button label, data table row)
    - Side-by-side comparison if multiple candidates for one role
    - Real content that matches the product (e.g., civic tech → government data examples)
@@ -216,11 +254,17 @@ The agent writes a **single, self-contained HTML file** (no framework dependenci
    - Swatches with hex values and names
    - Sample UI components rendered in the palette: buttons (primary, secondary, ghost), cards, form inputs, alerts (success, warning, error, info)
    - Background/text color combinations showing contrast
-6. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
-7. **Clean, professional layout** — the preview page IS a taste signal for the skill
-8. **Responsive** — looks good on any screen width
-
-The page should make the user think "oh nice, they thought of this." It's selling the design system visually, not just listing hex codes.
+6. **Realistic product mockups** — this is what makes the preview page powerful. Based on the project type from Phase 1, render 2-3 realistic page layouts using the full design system:
+   - **Dashboard / web app:** sample data table with metrics, sidebar nav, header with user avatar, stat cards
+   - **Marketing site:** hero section with real copy, feature highlights, testimonial block, CTA
+   - **Settings / admin:** form with labeled inputs, toggle switches, dropdowns, save button
+   - **Auth / onboarding:** login form with social buttons, branding, input validation states
+   - Use the product name, realistic content for the domain, and the proposed spacing/layout/border-radius. The user should see their product (roughly) before writing any code.
+7. **Light/dark mode toggle** using CSS custom properties and a JS toggle button
+8. **Clean, professional layout** — the preview page IS a taste signal for the skill
+9. **Responsive** — looks good on any screen width
+
+The page should make the user think "oh nice, they thought of this." It's selling the design system by showing what the product could feel like, not just listing hex codes and font names.
 
 If `open` fails (headless environment), tell the user: *"I wrote the preview to [path] — open it in your browser to see the fonts and colors rendered."*
 

From 5e9f0e78f293c55e80198e2e931be35597ad0cbb Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 12:22:10 -0500
Subject: [PATCH 13/22] feat: SELECTIVE EXPANSION + smarter ship gates (v0.5.3)
 (#134)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: SELECTIVE EXPANSION mode + user control for CEO review

Add 4th mode to /plan-ceo-review: SELECTIVE EXPANSION holds current scope
as baseline but surfaces expansion opportunities one by one for cherry-picking.
All modes now present every scope-expanding idea as individual AskUserQuestion
calls — user opts in or out of each one. EXPANSION recommends enthusiastically,
SELECTIVE recommends neutrally. CEO plan persistence writes decisions to disk.

* feat: review dashboard — eng required, CEO/design optional

Only Eng Review gates shipping. CEO Review recommended for big product
changes, Design Review for UI work — both informational only. Adds
skip_eng_review global config to disable the gate entirely.

* chore: bump version and changelog (v0.5.3)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                  |  18 +++
 VERSION                       |   2 +-
 plan-ceo-review/SKILL.md      | 219 ++++++++++++++++++++++++----------
 plan-ceo-review/SKILL.md.tmpl | 191 +++++++++++++++++++++--------
 plan-design-review/SKILL.md   |  28 +++--
 plan-eng-review/SKILL.md      |  28 +++--
 scripts/gen-skill-docs.ts     |  28 +++--
 ship/SKILL.md                 |  39 +++---
 ship/SKILL.md.tmpl            |   9 +-
 test/gen-skill-docs.test.ts   |   5 +-
 test/skill-e2e.test.ts        |  83 +++++++++++++
 test/skill-validation.test.ts |  30 +++++
 12 files changed, 518 insertions(+), 162 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 38a4aef0..a61be2db 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,23 @@
 # Changelog
 
+## 0.5.3 — 2026-03-17
+
+- **You're always in control — even when dreaming big.** `/plan-ceo-review` now presents every scope expansion as an individual decision you opt into. EXPANSION mode recommends enthusiastically, but you say yes or no to each idea. No more "the agent went wild and added 5 features I didn't ask for."
+- **New mode: SELECTIVE EXPANSION.** Hold your current scope as the baseline, but see what else is possible. The agent surfaces expansion opportunities one by one with neutral recommendations — you cherry-pick the ones worth doing. Perfect for iterating on existing features where you want rigor but also want to be tempted by adjacent improvements.
+- **Your CEO review visions are saved, not lost.** Expansion ideas, cherry-pick decisions, and 10x visions are now persisted to `~/.gstack/projects/{repo}/ceo-plans/` as structured design documents. Stale plans get archived automatically. If a vision is exceptional, you can promote it to `docs/designs/` in your repo for the team.
+
+- **Smarter ship gates.** `/ship` no longer nags you about CEO and Design reviews when they're not relevant. Eng Review is the only required gate (and you can disable even that with `gstack-config set skip_eng_review true`). CEO Review is recommended for big product changes; Design Review for UI work. The dashboard still shows all three — it just won't block you for the optional ones.
+
+### For contributors
+
+- Added SELECTIVE EXPANSION mode to `plan-ceo-review/SKILL.md.tmpl` with cherry-pick ceremony, neutral recommendation posture, and HOLD SCOPE baseline.
+- Rewrote EXPANSION mode's Step 0D to include opt-in ceremony — distill vision into discrete proposals, present each as AskUserQuestion.
+- Added CEO plan persistence (0D-POST step): structured markdown with YAML frontmatter (`status: ACTIVE/ARCHIVED/PROMOTED`), scope decisions table, archival flow.
+- Added `docs/designs` promotion step after Review Log.
+- Mode Quick Reference table expanded to 4 columns.
+- Review Readiness Dashboard: Eng Review required (overridable via `skip_eng_review` config), CEO/Design optional with agent judgment.
+- New tests: CEO review mode validation (4 modes, persistence, promotion), SELECTIVE EXPANSION E2E test.
+
 ## 0.5.2 — 2026-03-17
 
 - **Your design consultant now takes creative risks.** `/design-consultation` doesn't just propose a safe, coherent system — it explicitly breaks down SAFE CHOICES (category baseline) vs. RISKS (where your product stands out). You pick which rules to break. Every risk comes with a rationale for why it works and what it costs.
diff --git a/VERSION b/VERSION
index cb0c939a..be14282b 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.2
+0.5.3
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index 033f4e5f..7f48cbe7 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -3,9 +3,9 @@ name: plan-ceo-review
 version: 1.0.0
 description: |
   CEO/founder-mode plan review. Rethink the problem, find the 10-star product,
-  challenge premises, expand scope when it creates a better product. Three modes:
-  SCOPE EXPANSION (dream big), HOLD SCOPE (maximum rigor), SCOPE REDUCTION
-  (strip to essentials).
+  challenge premises, expand scope when it creates a better product. Four modes:
+  SCOPE EXPANSION (dream big), SELECTIVE EXPANSION (hold scope + cherry-pick
+  expansions), HOLD SCOPE (maximum rigor), SCOPE REDUCTION (strip to essentials).
 allowed-tools:
   - Read
   - Grep
@@ -105,10 +105,11 @@ branch name wherever the instructions say "the base branch."
 ## Philosophy
 You are not here to rubber-stamp this plan. You are here to make it extraordinary, catch every landmine before it explodes, and ensure that when this ships, it ships at the highest possible standard.
 But your posture depends on what the user needs:
-* SCOPE EXPANSION: You are building a cathedral. Envision the platonic ideal. Push scope UP. Ask "what would make this 10x better for 2x the effort?" The answer to "should we also build X?" is "yes, if it serves the vision." You have permission to dream.
+* SCOPE EXPANSION: You are building a cathedral. Envision the platonic ideal. Push scope UP. Ask "what would make this 10x better for 2x the effort?" You have permission to dream — and to recommend enthusiastically. But every expansion is the user's decision. Present each scope-expanding idea as an AskUserQuestion. The user opts in or out.
+* SELECTIVE EXPANSION: You are a rigorous reviewer who also has taste. Hold the current scope as your baseline — make it bulletproof. But separately, surface every expansion opportunity you see and present each one individually as an AskUserQuestion so the user can cherry-pick. Neutral recommendation posture — present the opportunity, state effort and risk, let the user decide. Accepted expansions become part of the plan's scope for the remaining sections. Rejected ones go to "NOT in scope."
 * HOLD SCOPE: You are a rigorous reviewer. The plan's scope is accepted. Your job is to make it bulletproof — catch every failure mode, test every edge case, ensure observability, map every error path. Do not silently reduce OR expand.
 * SCOPE REDUCTION: You are a surgeon. Find the minimum viable version that achieves the core outcome. Cut everything else. Be ruthless.
-Critical rule: Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
+Critical rule: In ALL modes, the user is 100% in control. Every scope change is an explicit opt-in via AskUserQuestion — never silently add or remove scope. Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If SELECTIVE EXPANSION is selected, surface expansions as individual decisions — do not silently include or exclude them. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
 Do NOT make any code changes. Do NOT start implementation. Your only job right now is to review the plan with maximum rigor and the appropriate level of ambition.
 
 ## Prime Directives
@@ -164,7 +165,7 @@ Map:
 ### Retrospective Check
 Check the git log for this branch. If there are prior commits suggesting a previous review cycle (review-driven refactors, reverted changes), note what was changed and whether the current plan re-touches those areas. Be MORE aggressive reviewing areas that were previously problematic. Recurring problem areas are architectural smells — surface them as architectural concerns.
 
-### Taste Calibration (EXPANSION mode only)
+### Taste Calibration (EXPANSION and SELECTIVE EXPANSION modes)
 Identify 2-3 files or patterns in the existing codebase that are particularly well-designed. Note them as style references for the review. Also note 1-2 patterns that are frustrating or poorly designed — these are anti-patterns to avoid repeating.
 Report findings before proceeding to Step 0.
 
@@ -187,10 +188,20 @@ Describe the ideal end state of this system 12 months from now. Does this plan m
 ```
 
 ### 0D. Mode-Specific Analysis
-**For SCOPE EXPANSION** — run all three:
+**For SCOPE EXPANSION** — run all three, then the opt-in ceremony:
 1. 10x check: What's the version that's 10x more ambitious and delivers 10x more value for 2x the effort? Describe it concretely.
 2. Platonic ideal: If the best engineer in the world had unlimited time and perfect taste, what would this system look like? What would the user feel when using it? Start from experience, not architecture.
-3. Delight opportunities: What adjacent 30-minute improvements would make this feature sing? Things where a user would think "oh nice, they thought of that." List at least 3.
+3. Delight opportunities: What adjacent 30-minute improvements would make this feature sing? Things where a user would think "oh nice, they thought of that." List at least 5.
+4. **Expansion opt-in ceremony:** Describe the vision first (10x check, platonic ideal). Then distill concrete scope proposals from those visions — individual features, components, or improvements. Present each proposal as its own AskUserQuestion. Recommend enthusiastically — explain why it's worth doing. But the user decides. Options: **A)** Add to this plan's scope **B)** Defer to TODOS.md **C)** Skip. Accepted items become plan scope for all remaining review sections. Rejected items go to "NOT in scope."
+
+**For SELECTIVE EXPANSION** — run the HOLD SCOPE analysis first, then surface expansions:
+1. Complexity check: If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
+2. What is the minimum set of changes that achieves the stated goal? Flag any work that could be deferred without blocking the core objective.
+3. Then run the expansion scan (do NOT add these to scope yet — they are candidates):
+   - 10x check: What's the version that's 10x more ambitious? Describe it concretely.
+   - Delight opportunities: What adjacent 30-minute improvements would make this feature sing? List at least 5.
+   - Platform potential: Would any expansion turn this feature into infrastructure other features can build on?
+4. **Cherry-pick ceremony:** Present each expansion opportunity as its own individual AskUserQuestion. Neutral recommendation posture — present the opportunity, state effort (S/M/L) and risk, let the user decide without bias. Options: **A)** Add to this plan's scope **B)** Defer to TODOS.md **C)** Skip. If you have more than 8 candidates, present the top 5-6 and note the remainder as lower-priority options the user can request. Accepted items become plan scope for all remaining review sections. Rejected items go to "NOT in scope."
 
 **For HOLD SCOPE** — run this:
 1. Complexity check: If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
@@ -200,7 +211,57 @@ Describe the ideal end state of this system 12 months from now. Does this plan m
 1. Ruthless cut: What is the absolute minimum that ships value to a user? Everything else is deferred. No exceptions.
 2. What can be a follow-up PR? Separate "must ship together" from "nice to ship together."
 
-### 0E. Temporal Interrogation (EXPANSION and HOLD modes)
+### 0D-POST. Persist CEO Plan (EXPANSION and SELECTIVE EXPANSION only)
+
+After the opt-in/cherry-pick ceremony, write the plan to disk so the vision and decisions survive beyond this conversation. Only run this step for EXPANSION and SELECTIVE EXPANSION modes.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG/ceo-plans
+```
+
+Before writing, check for existing CEO plans in the ceo-plans/ directory. If any are >30 days old or their branch has been merged/deleted, offer to archive them:
+
+```bash
+mkdir -p ~/.gstack/projects/$SLUG/ceo-plans/archive
+# For each stale plan: mv ~/.gstack/projects/$SLUG/ceo-plans/{old-plan}.md ~/.gstack/projects/$SLUG/ceo-plans/archive/
+```
+
+Write to `~/.gstack/projects/$SLUG/ceo-plans/{date}-{feature-slug}.md` using this format:
+
+```markdown
+---
+status: ACTIVE
+---
+# CEO Plan: {Feature Name}
+Generated by /plan-ceo-review on {date}
+Branch: {branch} | Mode: {EXPANSION / SELECTIVE EXPANSION}
+Repo: {owner/repo}
+
+## Vision
+
+### 10x Check
+{10x vision description}
+
+### Platonic Ideal
+{platonic ideal description — EXPANSION mode only}
+
+## Scope Decisions
+
+| # | Proposal | Effort | Decision | Reasoning |
+|---|----------|--------|----------|-----------|
+| 1 | {proposal} | S/M/L | ACCEPTED / DEFERRED / SKIPPED | {why} |
+
+## Accepted Scope (added to this plan)
+- {bullet list of what's now in scope}
+
+## Deferred to TODOS.md
+- {items with context}
+```
+
+Derive the feature slug from the plan being reviewed (e.g., "user-dashboard", "auth-refactor"). Use the date in YYYY-MM-DD format.
+
+### 0E. Temporal Interrogation (EXPANSION, SELECTIVE EXPANSION, and HOLD modes)
 Think ahead to implementation: What decisions will need to be made during implementation that should be resolved NOW in the plan?
 ```
   HOUR 1 (foundations):     What does the implementer need to know?
@@ -211,17 +272,22 @@ Think ahead to implementation: What decisions will need to be made during implem
 Surface these as questions for the user NOW, not as "figure it out later."
 
 ### 0F. Mode Selection
-Present three options:
-1. **SCOPE EXPANSION:** The plan is good but could be great. Propose the ambitious version, then review that. Push scope up. Build the cathedral.
-2. **HOLD SCOPE:** The plan's scope is right. Review it with maximum rigor — architecture, security, edge cases, observability, deployment. Make it bulletproof.
-3. **SCOPE REDUCTION:** The plan is overbuilt or wrong-headed. Propose a minimal version that achieves the core goal, then review that.
+In every mode, you are 100% in control. No scope is added without your explicit approval.
+
+Present four options:
+1. **SCOPE EXPANSION:** The plan is good but could be great. Dream big — propose the ambitious version. Every expansion is presented individually for your approval. You opt in to each one.
+2. **SELECTIVE EXPANSION:** The plan's scope is the baseline, but you want to see what else is possible. Every expansion opportunity is presented individually — you cherry-pick the ones worth doing. Neutral recommendations.
+3. **HOLD SCOPE:** The plan's scope is right. Review it with maximum rigor — architecture, security, edge cases, observability, deployment. Make it bulletproof. No expansions surfaced.
+4. **SCOPE REDUCTION:** The plan is overbuilt or wrong-headed. Propose a minimal version that achieves the core goal, then review that.
 
 Context-dependent defaults:
 * Greenfield feature → default EXPANSION
+* Feature enhancement or iteration on existing system → default SELECTIVE EXPANSION
 * Bug fix or hotfix → default HOLD SCOPE
 * Refactor → default HOLD SCOPE
 * Plan touching >15 files → suggest REDUCTION unless user pushes back
 * User says "go big" / "ambitious" / "cathedral" → EXPANSION, no question
+* User says "hold scope but tempt me" / "show me options" / "cherry-pick" → SELECTIVE EXPANSION, no question
 
 Once selected, commit fully. Do not silently drift.
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
@@ -244,10 +310,12 @@ Evaluate and diagram:
 * Production failure scenarios. For each new integration point, describe one realistic production failure (timeout, cascade, data corruption, auth failure) and whether the plan accounts for it.
 * Rollback posture. If this ships and immediately breaks, what's the rollback procedure? Git revert? Feature flag? DB migration rollback? How long?
 
-**EXPANSION mode additions:**
+**EXPANSION and SELECTIVE EXPANSION additions:**
 * What would make this architecture beautiful? Not just correct — elegant. Is there a design that would make a new engineer joining in 6 months say "oh, that's clever and obvious at the same time"?
 * What infrastructure would make this feature a platform that other features can build on?
 
+**SELECTIVE EXPANSION:** If any accepted cherry-picks from Step 0D affect the architecture, evaluate their architectural fit here. Flag any that create coupling concerns or don't integrate cleanly — this is a chance to revisit the decision with new information.
+
 Required ASCII diagram: full system architecture showing new components and their relationships to existing ones.
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
@@ -406,8 +474,8 @@ Evaluate:
 * Admin tooling. New operational tasks that need admin UI or rake tasks?
 * Runbooks. For each new failure mode: what's the operational response?
 
-**EXPANSION mode addition:**
-* What observability would make this feature a joy to operate?
+**EXPANSION and SELECTIVE EXPANSION addition:**
+* What observability would make this feature a joy to operate? (For SELECTIVE EXPANSION, include observability for any accepted cherry-picks.)
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ### Section 9: Deployment & Rollout Review
@@ -421,8 +489,8 @@ Evaluate:
 * Post-deploy verification checklist. First 5 minutes? First hour?
 * Smoke tests. What automated checks should run immediately post-deploy?
 
-**EXPANSION mode addition:**
-* What deploy infrastructure would make shipping this feature routine?
+**EXPANSION and SELECTIVE EXPANSION addition:**
+* What deploy infrastructure would make shipping this feature routine? (For SELECTIVE EXPANSION, assess whether accepted cherry-picks change the deployment risk profile.)
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ### Section 10: Long-Term Trajectory Review
@@ -434,9 +502,10 @@ Evaluate:
 * Ecosystem fit. Aligns with Rails/JS ecosystem direction?
 * The 1-year question. Read this plan as a new engineer in 12 months — obvious?
 
-**EXPANSION mode additions:**
+**EXPANSION and SELECTIVE EXPANSION additions:**
 * What comes after this ships? Phase 2? Phase 3? Does the architecture support that trajectory?
 * Platform potential. Does this create capabilities other features can leverage?
+* (SELECTIVE EXPANSION only) Retrospective: Were the right cherry-picks accepted? Did any rejected expansions turn out to be load-bearing for the accepted ones?
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ## CRITICAL RULE — How to ask questions
@@ -485,8 +554,11 @@ For each TODO, describe:
 
 Then present options: **A)** Add to TODOS.md **B)** Skip — not valuable enough **C)** Build it now in this PR instead of deferring.
 
-### Delight Opportunities (EXPANSION mode only)
-Identify at least 5 "bonus chunk" opportunities (<30 min each) that would make users think "oh nice, they thought of that." Present each delight opportunity as its own individual AskUserQuestion. Never batch them. For each one, describe what it is, why it would delight users, and effort estimate. Then present options: **A)** Add to TODOS.md as a vision item **B)** Skip **C)** Build it now in this PR.
+### Scope Expansion Decisions (EXPANSION and SELECTIVE EXPANSION only)
+For EXPANSION and SELECTIVE EXPANSION modes: expansion opportunities and delight items were surfaced and decided in Step 0D (opt-in/cherry-pick ceremony). The decisions are persisted in the CEO plan document. Reference the CEO plan for the full record. Do not re-surface them here — just list the outcome of each decision for completeness:
+* Accepted: {list items added to scope}
+* Deferred: {list items sent to TODOS.md}
+* Skipped: {list items rejected}
 
 ### Diagrams (mandatory, produce all that apply)
 1. System architecture
@@ -504,7 +576,7 @@ List every ASCII diagram in files this plan touches. Still accurate?
   +====================================================================+
   |            MEGA PLAN REVIEW — COMPLETION SUMMARY                   |
   +====================================================================+
-  | Mode selected        | EXPANSION / HOLD / REDUCTION                |
+  | Mode selected        | EXPANSION / SELECTIVE / HOLD / REDUCTION    |
   | System Audit         | [key findings]                              |
   | Step 0               | [mode + key decisions]                      |
   | Section 1  (Arch)    | ___ issues found                            |
@@ -524,7 +596,8 @@ List every ASCII diagram in files this plan touches. Still accurate?
   | Error/rescue registry| ___ methods, ___ CRITICAL GAPS              |
   | Failure modes        | ___ total, ___ CRITICAL GAPS                |
   | TODOS.md updates     | ___ items proposed                          |
-  | Delight opportunities| ___ identified (EXPANSION only)             |
+  | Scope proposals      | ___ proposed, ___ accepted (EXP + SEL)      |
+  | CEO plan             | written / skipped (HOLD/REDUCTION)          |
   | Diagrams produced    | ___ (list types)                            |
   | Stale diagrams found | ___                                         |
   | Unresolved decisions | ___ (listed below)                          |
@@ -549,15 +622,17 @@ Before running this command, substitute the placeholder values from the Completi
 - **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
 - **unresolved**: number from "Unresolved decisions" in the summary
 - **critical_gaps**: number from "Failure modes: ___ CRITICAL GAPS" in the summary
-- **MODE**: the mode the user selected (SCOPE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
+- **MODE**: the mode the user selected (SCOPE_EXPANSION / SELECTIVE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
 
 ## Review Readiness Dashboard
 
-After completing the review, read the review log to display the dashboard.
+After completing the review, read the review log and config to display the dashboard.
 
 ```bash
 eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+echo "---CONFIG---"
+~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
 Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
@@ -566,20 +641,37 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 +====================================================================+
 |                    REVIEW READINESS DASHBOARD                       |
 +====================================================================+
-| Review          | Runs | Last Run            | Status               |
-|-----------------|------|---------------------|----------------------|
-| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
-| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
-| Design Review   |  0   | —                   | NOT YET RUN          |
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  0   | —                   | —         | no       |
+| Design Review   |  0   | —                   | —         | no       |
 +--------------------------------------------------------------------+
-| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
+| VERDICT: CLEARED — Eng Review passed                                |
 +====================================================================+
 ```
 
+**Review tiers:**
+- **Eng Review (required by default):** The only review that gates shipping. Covers architecture, code quality, tests, performance. Can be disabled globally with `gstack-config set skip_eng_review true` (the "don't bother me" setting).
+- **CEO Review (optional):** Use your judgment. Recommend it for big product/business changes, new user-facing features, or scope decisions. Skip for bug fixes, refactors, infra, and cleanup.
+- **Design Review (optional):** Use your judgment. Recommend it for UI/UX changes. Skip for backend-only, infra, or prompt-only changes.
+
 **Verdict logic:**
-- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
-- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
-- Informational only — does NOT block.
+- **CLEARED**: Eng Review has >= 1 entry within 7 days with status "clean" (or `skip_eng_review` is `true`)
+- **NOT CLEARED**: Eng Review missing, stale (>7 days), or has open issues
+- CEO and Design reviews are shown for context but never block shipping
+- If `skip_eng_review` config is `true`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED
+
+## docs/designs Promotion (EXPANSION and SELECTIVE EXPANSION only)
+
+At the end of the review, if the vision produced a compelling feature direction, offer to promote the CEO plan to the project repo. AskUserQuestion:
+
+"The vision from this review produced {N} accepted scope expansions. Want to promote it to a design doc in the repo?"
+- **A)** Promote to `docs/designs/{FEATURE}.md` (committed to repo, visible to the team)
+- **B)** Keep in `~/.gstack/projects/` only (local, personal reference)
+- **C)** Skip
+
+If promoted, copy the CEO plan content to `docs/designs/{FEATURE}.md` (create the directory if needed) and update the `status` field in the original CEO plan from `ACTIVE` to `PROMOTED`.
 
 ## Formatting Rules
 * NUMBER issues (1, 2, 3...) and LETTERS for options (A, B, C...).
@@ -590,30 +682,37 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 
 ## Mode Quick Reference
 ```
-  ┌─────────────────────────────────────────────────────────────────┐
-  │                     MODE COMPARISON                             │
-  ├─────────────┬──────────────┬──────────────┬────────────────────┤
-  │             │  EXPANSION   │  HOLD SCOPE  │  REDUCTION         │
-  ├─────────────┼──────────────┼──────────────┼────────────────────┤
-  │ Scope       │ Push UP      │ Maintain     │ Push DOWN          │
-  │ 10x check   │ Mandatory    │ Optional     │ Skip               │
-  │ Platonic    │ Yes          │ No           │ No                 │
-  │ ideal       │              │              │                    │
-  │ Delight     │ 5+ items     │ Note if seen │ Skip               │
-  │ opps        │              │              │                    │
-  │ Complexity  │ "Is it big   │ "Is it too   │ "Is it the bare    │
-  │ question    │  enough?"    │  complex?"   │  minimum?"         │
-  │ Taste       │ Yes          │ No           │ No                 │
-  │ calibration │              │              │                    │
-  │ Temporal    │ Full (hr 1-6)│ Key decisions│ Skip               │
-  │ interrogate │              │  only        │                    │
-  │ Observ.     │ "Joy to      │ "Can we      │ "Can we see if     │
-  │ standard    │  operate"    │  debug it?"  │  it's broken?"     │
-  │ Deploy      │ Infra as     │ Safe deploy  │ Simplest possible  │
-  │ standard    │ feature scope│  + rollback  │  deploy            │
-  │ Error map   │ Full + chaos │ Full         │ Critical paths     │
-  │             │  scenarios   │              │  only              │
-  │ Phase 2/3   │ Map it       │ Note it      │ Skip               │
-  │ planning    │              │              │                    │
-  └─────────────┴──────────────┴──────────────┴────────────────────┘
+  ┌────────────────────────────────────────────────────────────────────────────────┐
+  │                            MODE COMPARISON                                     │
+  ├─────────────┬──────────────┬──────────────┬──────────────┬────────────────────┤
+  │             │  EXPANSION   │  SELECTIVE   │  HOLD SCOPE  │  REDUCTION         │
+  ├─────────────┼──────────────┼──────────────┼──────────────┼────────────────────┤
+  │ Scope       │ Push UP      │ Hold + offer │ Maintain     │ Push DOWN          │
+  │             │ (opt-in)     │              │              │                    │
+  │ Recommend   │ Enthusiastic │ Neutral      │ N/A          │ N/A                │
+  │ posture     │              │              │              │                    │
+  │ 10x check   │ Mandatory    │ Surface as   │ Optional     │ Skip               │
+  │             │              │ cherry-pick  │              │                    │
+  │ Platonic    │ Yes          │ No           │ No           │ No                 │
+  │ ideal       │              │              │              │                    │
+  │ Delight     │ Opt-in       │ Cherry-pick  │ Note if seen │ Skip               │
+  │ opps        │ ceremony     │ ceremony     │              │                    │
+  │ Complexity  │ "Is it big   │ "Is it right │ "Is it too   │ "Is it the bare    │
+  │ question    │  enough?"    │  + what else │  complex?"   │  minimum?"         │
+  │             │              │  is tempting"│              │                    │
+  │ Taste       │ Yes          │ Yes          │ No           │ No                 │
+  │ calibration │              │              │              │                    │
+  │ Temporal    │ Full (hr 1-6)│ Full (hr 1-6)│ Key decisions│ Skip               │
+  │ interrogate │              │              │  only        │                    │
+  │ Observ.     │ "Joy to      │ "Joy to      │ "Can we      │ "Can we see if     │
+  │ standard    │  operate"    │  operate"    │  debug it?"  │  it's broken?"     │
+  │ Deploy      │ Infra as     │ Safe deploy  │ Safe deploy  │ Simplest possible  │
+  │ standard    │ feature scope│ + cherry-pick│  + rollback  │  deploy            │
+  │             │              │  risk check  │              │                    │
+  │ Error map   │ Full + chaos │ Full + chaos │ Full         │ Critical paths     │
+  │             │  scenarios   │ for accepted │              │  only              │
+  │ CEO plan    │ Written      │ Written      │ Skipped      │ Skipped            │
+  │ Phase 2/3   │ Map accepted │ Map accepted │ Note it      │ Skip               │
+  │ planning    │              │ cherry-picks │              │                    │
+  └─────────────┴──────────────┴──────────────┴──────────────┴────────────────────┘
 ```
diff --git a/plan-ceo-review/SKILL.md.tmpl b/plan-ceo-review/SKILL.md.tmpl
index 8664d095..3165dc5b 100644
--- a/plan-ceo-review/SKILL.md.tmpl
+++ b/plan-ceo-review/SKILL.md.tmpl
@@ -3,9 +3,9 @@ name: plan-ceo-review
 version: 1.0.0
 description: |
   CEO/founder-mode plan review. Rethink the problem, find the 10-star product,
-  challenge premises, expand scope when it creates a better product. Three modes:
-  SCOPE EXPANSION (dream big), HOLD SCOPE (maximum rigor), SCOPE REDUCTION
-  (strip to essentials).
+  challenge premises, expand scope when it creates a better product. Four modes:
+  SCOPE EXPANSION (dream big), SELECTIVE EXPANSION (hold scope + cherry-pick
+  expansions), HOLD SCOPE (maximum rigor), SCOPE REDUCTION (strip to essentials).
 allowed-tools:
   - Read
   - Grep
@@ -23,10 +23,11 @@ allowed-tools:
 ## Philosophy
 You are not here to rubber-stamp this plan. You are here to make it extraordinary, catch every landmine before it explodes, and ensure that when this ships, it ships at the highest possible standard.
 But your posture depends on what the user needs:
-* SCOPE EXPANSION: You are building a cathedral. Envision the platonic ideal. Push scope UP. Ask "what would make this 10x better for 2x the effort?" The answer to "should we also build X?" is "yes, if it serves the vision." You have permission to dream.
+* SCOPE EXPANSION: You are building a cathedral. Envision the platonic ideal. Push scope UP. Ask "what would make this 10x better for 2x the effort?" You have permission to dream — and to recommend enthusiastically. But every expansion is the user's decision. Present each scope-expanding idea as an AskUserQuestion. The user opts in or out.
+* SELECTIVE EXPANSION: You are a rigorous reviewer who also has taste. Hold the current scope as your baseline — make it bulletproof. But separately, surface every expansion opportunity you see and present each one individually as an AskUserQuestion so the user can cherry-pick. Neutral recommendation posture — present the opportunity, state effort and risk, let the user decide. Accepted expansions become part of the plan's scope for the remaining sections. Rejected ones go to "NOT in scope."
 * HOLD SCOPE: You are a rigorous reviewer. The plan's scope is accepted. Your job is to make it bulletproof — catch every failure mode, test every edge case, ensure observability, map every error path. Do not silently reduce OR expand.
 * SCOPE REDUCTION: You are a surgeon. Find the minimum viable version that achieves the core outcome. Cut everything else. Be ruthless.
-Critical rule: Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
+Critical rule: In ALL modes, the user is 100% in control. Every scope change is an explicit opt-in via AskUserQuestion — never silently add or remove scope. Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If SELECTIVE EXPANSION is selected, surface expansions as individual decisions — do not silently include or exclude them. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
 Do NOT make any code changes. Do NOT start implementation. Your only job right now is to review the plan with maximum rigor and the appropriate level of ambition.
 
 ## Prime Directives
@@ -82,7 +83,7 @@ Map:
 ### Retrospective Check
 Check the git log for this branch. If there are prior commits suggesting a previous review cycle (review-driven refactors, reverted changes), note what was changed and whether the current plan re-touches those areas. Be MORE aggressive reviewing areas that were previously problematic. Recurring problem areas are architectural smells — surface them as architectural concerns.
 
-### Taste Calibration (EXPANSION mode only)
+### Taste Calibration (EXPANSION and SELECTIVE EXPANSION modes)
 Identify 2-3 files or patterns in the existing codebase that are particularly well-designed. Note them as style references for the review. Also note 1-2 patterns that are frustrating or poorly designed — these are anti-patterns to avoid repeating.
 Report findings before proceeding to Step 0.
 
@@ -105,10 +106,20 @@ Describe the ideal end state of this system 12 months from now. Does this plan m
 ```
 
 ### 0D. Mode-Specific Analysis
-**For SCOPE EXPANSION** — run all three:
+**For SCOPE EXPANSION** — run all three, then the opt-in ceremony:
 1. 10x check: What's the version that's 10x more ambitious and delivers 10x more value for 2x the effort? Describe it concretely.
 2. Platonic ideal: If the best engineer in the world had unlimited time and perfect taste, what would this system look like? What would the user feel when using it? Start from experience, not architecture.
-3. Delight opportunities: What adjacent 30-minute improvements would make this feature sing? Things where a user would think "oh nice, they thought of that." List at least 3.
+3. Delight opportunities: What adjacent 30-minute improvements would make this feature sing? Things where a user would think "oh nice, they thought of that." List at least 5.
+4. **Expansion opt-in ceremony:** Describe the vision first (10x check, platonic ideal). Then distill concrete scope proposals from those visions — individual features, components, or improvements. Present each proposal as its own AskUserQuestion. Recommend enthusiastically — explain why it's worth doing. But the user decides. Options: **A)** Add to this plan's scope **B)** Defer to TODOS.md **C)** Skip. Accepted items become plan scope for all remaining review sections. Rejected items go to "NOT in scope."
+
+**For SELECTIVE EXPANSION** — run the HOLD SCOPE analysis first, then surface expansions:
+1. Complexity check: If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
+2. What is the minimum set of changes that achieves the stated goal? Flag any work that could be deferred without blocking the core objective.
+3. Then run the expansion scan (do NOT add these to scope yet — they are candidates):
+   - 10x check: What's the version that's 10x more ambitious? Describe it concretely.
+   - Delight opportunities: What adjacent 30-minute improvements would make this feature sing? List at least 5.
+   - Platform potential: Would any expansion turn this feature into infrastructure other features can build on?
+4. **Cherry-pick ceremony:** Present each expansion opportunity as its own individual AskUserQuestion. Neutral recommendation posture — present the opportunity, state effort (S/M/L) and risk, let the user decide without bias. Options: **A)** Add to this plan's scope **B)** Defer to TODOS.md **C)** Skip. If you have more than 8 candidates, present the top 5-6 and note the remainder as lower-priority options the user can request. Accepted items become plan scope for all remaining review sections. Rejected items go to "NOT in scope."
 
 **For HOLD SCOPE** — run this:
 1. Complexity check: If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
@@ -118,7 +129,57 @@ Describe the ideal end state of this system 12 months from now. Does this plan m
 1. Ruthless cut: What is the absolute minimum that ships value to a user? Everything else is deferred. No exceptions.
 2. What can be a follow-up PR? Separate "must ship together" from "nice to ship together."
 
-### 0E. Temporal Interrogation (EXPANSION and HOLD modes)
+### 0D-POST. Persist CEO Plan (EXPANSION and SELECTIVE EXPANSION only)
+
+After the opt-in/cherry-pick ceremony, write the plan to disk so the vision and decisions survive beyond this conversation. Only run this step for EXPANSION and SELECTIVE EXPANSION modes.
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG/ceo-plans
+```
+
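+Before writing, check for existing CEO plans in the ceo-plans/ directory. If any are >30 days old or their branch has been merged/deleted, offer to archive them (`$SLUG` below is the value set by the `gstack-slug` eval in the previous block — re-run that eval first if the variable is no longer set):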
+
+```bash
+mkdir -p ~/.gstack/projects/$SLUG/ceo-plans/archive
+# For each stale plan: mv ~/.gstack/projects/$SLUG/ceo-plans/{old-plan}.md ~/.gstack/projects/$SLUG/ceo-plans/archive/
+```
+
+Write to `~/.gstack/projects/$SLUG/ceo-plans/{date}-{feature-slug}.md` using this format:
+
+```markdown
+---
+status: ACTIVE
+---
+# CEO Plan: {Feature Name}
+Generated by /plan-ceo-review on {date}
+Branch: {branch} | Mode: {EXPANSION / SELECTIVE EXPANSION}
+Repo: {owner/repo}
+
+## Vision
+
+### 10x Check
+{10x vision description}
+
+### Platonic Ideal
+{platonic ideal description — EXPANSION mode only}
+
+## Scope Decisions
+
+| # | Proposal | Effort | Decision | Reasoning |
+|---|----------|--------|----------|-----------|
+| 1 | {proposal} | S/M/L | ACCEPTED / DEFERRED / SKIPPED | {why} |
+
+## Accepted Scope (added to this plan)
+- {bullet list of what's now in scope}
+
+## Deferred to TODOS.md
+- {items with context}
+```
+
+Derive the feature slug from the plan being reviewed (e.g., "user-dashboard", "auth-refactor"). Use the date in YYYY-MM-DD format.
+
+### 0E. Temporal Interrogation (EXPANSION, SELECTIVE EXPANSION, and HOLD modes)
 Think ahead to implementation: What decisions will need to be made during implementation that should be resolved NOW in the plan?
 ```
   HOUR 1 (foundations):     What does the implementer need to know?
@@ -129,17 +190,22 @@ Think ahead to implementation: What decisions will need to be made during implem
 Surface these as questions for the user NOW, not as "figure it out later."
 
 ### 0F. Mode Selection
-Present three options:
-1. **SCOPE EXPANSION:** The plan is good but could be great. Propose the ambitious version, then review that. Push scope up. Build the cathedral.
-2. **HOLD SCOPE:** The plan's scope is right. Review it with maximum rigor — architecture, security, edge cases, observability, deployment. Make it bulletproof.
-3. **SCOPE REDUCTION:** The plan is overbuilt or wrong-headed. Propose a minimal version that achieves the core goal, then review that.
+Open by telling the user: "In every mode, you are 100% in control. No scope is added without your explicit approval."
+
+Present four options:
+1. **SCOPE EXPANSION:** The plan is good but could be great. Dream big — propose the ambitious version. Every expansion is presented individually for your approval. You opt in to each one.
+2. **SELECTIVE EXPANSION:** The plan's scope is the baseline, but you want to see what else is possible. Every expansion opportunity is presented individually — you cherry-pick the ones worth doing. Neutral recommendations.
+3. **HOLD SCOPE:** The plan's scope is right. Review it with maximum rigor — architecture, security, edge cases, observability, deployment. Make it bulletproof. No expansions surfaced.
+4. **SCOPE REDUCTION:** The plan is overbuilt or wrong-headed. Propose a minimal version that achieves the core goal, then review that.
 
 Context-dependent defaults:
 * Greenfield feature → default EXPANSION
+* Feature enhancement or iteration on existing system → default SELECTIVE EXPANSION
 * Bug fix or hotfix → default HOLD SCOPE
 * Refactor → default HOLD SCOPE
 * Plan touching >15 files → suggest REDUCTION unless user pushes back
 * User says "go big" / "ambitious" / "cathedral" → EXPANSION, no question
+* User says "hold scope but tempt me" / "show me options" / "cherry-pick" → SELECTIVE EXPANSION, no question
 
 Once selected, commit fully. Do not silently drift.
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
@@ -162,10 +228,12 @@ Evaluate and diagram:
 * Production failure scenarios. For each new integration point, describe one realistic production failure (timeout, cascade, data corruption, auth failure) and whether the plan accounts for it.
 * Rollback posture. If this ships and immediately breaks, what's the rollback procedure? Git revert? Feature flag? DB migration rollback? How long?
 
-**EXPANSION mode additions:**
+**EXPANSION and SELECTIVE EXPANSION additions:**
 * What would make this architecture beautiful? Not just correct — elegant. Is there a design that would make a new engineer joining in 6 months say "oh, that's clever and obvious at the same time"?
 * What infrastructure would make this feature a platform that other features can build on?
 
+**SELECTIVE EXPANSION:** If any accepted cherry-picks from Step 0D affect the architecture, evaluate their architectural fit here. Flag any that create coupling concerns or don't integrate cleanly — this is a chance to revisit the decision with new information.
+
 Required ASCII diagram: full system architecture showing new components and their relationships to existing ones.
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
@@ -324,8 +392,8 @@ Evaluate:
 * Admin tooling. New operational tasks that need admin UI or rake tasks?
 * Runbooks. For each new failure mode: what's the operational response?
 
-**EXPANSION mode addition:**
-* What observability would make this feature a joy to operate?
+**EXPANSION and SELECTIVE EXPANSION addition:**
+* What observability would make this feature a joy to operate? (For SELECTIVE EXPANSION, include observability for any accepted cherry-picks.)
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ### Section 9: Deployment & Rollout Review
@@ -339,8 +407,8 @@ Evaluate:
 * Post-deploy verification checklist. First 5 minutes? First hour?
 * Smoke tests. What automated checks should run immediately post-deploy?
 
-**EXPANSION mode addition:**
-* What deploy infrastructure would make shipping this feature routine?
+**EXPANSION and SELECTIVE EXPANSION addition:**
+* What deploy infrastructure would make shipping this feature routine? (For SELECTIVE EXPANSION, assess whether accepted cherry-picks change the deployment risk profile.)
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ### Section 10: Long-Term Trajectory Review
@@ -352,9 +420,10 @@ Evaluate:
 * Ecosystem fit. Aligns with Rails/JS ecosystem direction?
 * The 1-year question. Read this plan as a new engineer in 12 months — obvious?
 
-**EXPANSION mode additions:**
+**EXPANSION and SELECTIVE EXPANSION additions:**
 * What comes after this ships? Phase 2? Phase 3? Does the architecture support that trajectory?
 * Platform potential. Does this create capabilities other features can leverage?
+* (SELECTIVE EXPANSION only) Retrospective: Were the right cherry-picks accepted? Did any rejected expansions turn out to be load-bearing for the accepted ones?
 **STOP.** AskUserQuestion once per issue. Do NOT batch. Recommend + WHY. If no issues or fix is obvious, state what you'll do and move on — don't waste a question. Do NOT proceed until user responds.
 
 ## CRITICAL RULE — How to ask questions
@@ -403,8 +472,11 @@ For each TODO, describe:
 
 Then present options: **A)** Add to TODOS.md **B)** Skip — not valuable enough **C)** Build it now in this PR instead of deferring.
 
-### Delight Opportunities (EXPANSION mode only)
-Identify at least 5 "bonus chunk" opportunities (<30 min each) that would make users think "oh nice, they thought of that." Present each delight opportunity as its own individual AskUserQuestion. Never batch them. For each one, describe what it is, why it would delight users, and effort estimate. Then present options: **A)** Add to TODOS.md as a vision item **B)** Skip **C)** Build it now in this PR.
+### Scope Expansion Decisions (EXPANSION and SELECTIVE EXPANSION only)
+For EXPANSION and SELECTIVE EXPANSION modes: expansion opportunities and delight items were surfaced and decided in Step 0D (opt-in/cherry-pick ceremony). The decisions are persisted in the CEO plan document. Reference the CEO plan for the full record. Do not re-surface them here — summarize the decisions for completeness:
+* Accepted: {list items added to scope}
+* Deferred: {list items sent to TODOS.md}
+* Skipped: {list items rejected}
 
 ### Diagrams (mandatory, produce all that apply)
 1. System architecture
@@ -422,7 +494,7 @@ List every ASCII diagram in files this plan touches. Still accurate?
   +====================================================================+
   |            MEGA PLAN REVIEW — COMPLETION SUMMARY                   |
   +====================================================================+
-  | Mode selected        | EXPANSION / HOLD / REDUCTION                |
+  | Mode selected        | EXPANSION / SELECTIVE / HOLD / REDUCTION    |
   | System Audit         | [key findings]                              |
   | Step 0               | [mode + key decisions]                      |
   | Section 1  (Arch)    | ___ issues found                            |
@@ -442,7 +514,8 @@ List every ASCII diagram in files this plan touches. Still accurate?
   | Error/rescue registry| ___ methods, ___ CRITICAL GAPS              |
   | Failure modes        | ___ total, ___ CRITICAL GAPS                |
   | TODOS.md updates     | ___ items proposed                          |
-  | Delight opportunities| ___ identified (EXPANSION only)             |
+  | Scope proposals      | ___ proposed, ___ accepted (EXP + SEL)      |
+  | CEO plan             | written / skipped (HOLD/REDUCTION)          |
   | Diagrams produced    | ___ (list types)                            |
   | Stale diagrams found | ___                                         |
   | Unresolved decisions | ___ (listed below)                          |
@@ -467,10 +540,21 @@ Before running this command, substitute the placeholder values from the Completi
 - **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
 - **unresolved**: number from "Unresolved decisions" in the summary
 - **critical_gaps**: number from "Failure modes: ___ CRITICAL GAPS" in the summary
-- **MODE**: the mode the user selected (SCOPE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
+- **MODE**: the mode the user selected (SCOPE_EXPANSION / SELECTIVE_EXPANSION / HOLD_SCOPE / SCOPE_REDUCTION)
 
 {{REVIEW_DASHBOARD}}
 
+## docs/designs Promotion (EXPANSION and SELECTIVE EXPANSION only)
+
+At the end of the review, if the vision produced a compelling feature direction, offer to promote the CEO plan to the project repo. AskUserQuestion:
+
+"The vision from this review produced {N} accepted scope expansions. Want to promote it to a design doc in the repo?"
+- **A)** Promote to `docs/designs/{FEATURE}.md` (committed to repo, visible to the team)
+- **B)** Keep in `~/.gstack/projects/` only (local, personal reference)
+- **C)** Skip
+
+If promoted, copy the CEO plan content to `docs/designs/{FEATURE}.md` (create the directory if needed) and update the `status` field in the original CEO plan from `ACTIVE` to `PROMOTED`.
+
 ## Formatting Rules
 * NUMBER issues (1, 2, 3...) and LETTERS for options (A, B, C...).
 * Label with NUMBER + LETTER (e.g., "3A", "3B").
@@ -480,30 +564,37 @@ Before running this command, substitute the placeholder values from the Completi
 
 ## Mode Quick Reference
 ```
-  ┌─────────────────────────────────────────────────────────────────┐
-  │                     MODE COMPARISON                             │
-  ├─────────────┬──────────────┬──────────────┬────────────────────┤
-  │             │  EXPANSION   │  HOLD SCOPE  │  REDUCTION         │
-  ├─────────────┼──────────────┼──────────────┼────────────────────┤
-  │ Scope       │ Push UP      │ Maintain     │ Push DOWN          │
-  │ 10x check   │ Mandatory    │ Optional     │ Skip               │
-  │ Platonic    │ Yes          │ No           │ No                 │
-  │ ideal       │              │              │                    │
-  │ Delight     │ 5+ items     │ Note if seen │ Skip               │
-  │ opps        │              │              │                    │
-  │ Complexity  │ "Is it big   │ "Is it too   │ "Is it the bare    │
-  │ question    │  enough?"    │  complex?"   │  minimum?"         │
-  │ Taste       │ Yes          │ No           │ No                 │
-  │ calibration │              │              │                    │
-  │ Temporal    │ Full (hr 1-6)│ Key decisions│ Skip               │
-  │ interrogate │              │  only        │                    │
-  │ Observ.     │ "Joy to      │ "Can we      │ "Can we see if     │
-  │ standard    │  operate"    │  debug it?"  │  it's broken?"     │
-  │ Deploy      │ Infra as     │ Safe deploy  │ Simplest possible  │
-  │ standard    │ feature scope│  + rollback  │  deploy            │
-  │ Error map   │ Full + chaos │ Full         │ Critical paths     │
-  │             │  scenarios   │              │  only              │
-  │ Phase 2/3   │ Map it       │ Note it      │ Skip               │
-  │ planning    │              │              │                    │
-  └─────────────┴──────────────┴──────────────┴────────────────────┘
+  ┌────────────────────────────────────────────────────────────────────────────────┐
+  │                            MODE COMPARISON                                     │
+  ├─────────────┬──────────────┬──────────────┬──────────────┬────────────────────┤
+  │             │  EXPANSION   │  SELECTIVE   │  HOLD SCOPE  │  REDUCTION         │
+  ├─────────────┼──────────────┼──────────────┼──────────────┼────────────────────┤
+  │ Scope       │ Push UP      │ Hold + offer │ Maintain     │ Push DOWN          │
+  │             │ (opt-in)     │              │              │                    │
+  │ Recommend   │ Enthusiastic │ Neutral      │ N/A          │ N/A                │
+  │ posture     │              │              │              │                    │
+  │ 10x check   │ Mandatory    │ Surface as   │ Optional     │ Skip               │
+  │             │              │ cherry-pick  │              │                    │
+  │ Platonic    │ Yes          │ No           │ No           │ No                 │
+  │ ideal       │              │              │              │                    │
+  │ Delight     │ Opt-in       │ Cherry-pick  │ Note if seen │ Skip               │
+  │ opps        │ ceremony     │ ceremony     │              │                    │
+  │ Complexity  │ "Is it big   │ "Is it right │ "Is it too   │ "Is it the bare    │
+  │ question    │  enough?"    │  + what else │  complex?"   │  minimum?"         │
+  │             │              │  is tempting"│              │                    │
+  │ Taste       │ Yes          │ Yes          │ No           │ No                 │
+  │ calibration │              │              │              │                    │
+  │ Temporal    │ Full (hr 1-6)│ Full (hr 1-6)│ Key decisions│ Skip               │
+  │ interrogate │              │              │  only        │                    │
+  │ Observ.     │ "Joy to      │ "Joy to      │ "Can we      │ "Can we see if     │
+  │ standard    │  operate"    │  operate"    │  debug it?"  │  it's broken?"     │
+  │ Deploy      │ Infra as     │ Safe deploy  │ Safe deploy  │ Simplest possible  │
+  │ standard    │ feature scope│ + cherry-pick│  + rollback  │  deploy            │
+  │             │              │  risk check  │              │                    │
+  │ Error map   │ Full + chaos │ Full + chaos │ Full         │ Critical paths     │
+  │             │  scenarios   │ for accepted │              │  only              │
+  │ CEO plan    │ Written      │ Written      │ Skipped      │ Skipped            │
+  │ Phase 2/3   │ Map accepted │ Map accepted │ Note it      │ Skip               │
+  │ planning    │              │ cherry-picks │              │                    │
+  └─────────────┴──────────────┴──────────────┴──────────────┴────────────────────┘
 ```
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index 8fb0bfeb..df5b43e8 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -576,11 +576,13 @@ Substitute values from the report:
 
 ## Review Readiness Dashboard
 
-After completing the review, read the review log to display the dashboard.
+After completing the review, read the review log and config to display the dashboard.
 
 ```bash
 eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+echo "---CONFIG---"
+~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
 Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
@@ -589,17 +591,23 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 +====================================================================+
 |                    REVIEW READINESS DASHBOARD                       |
 +====================================================================+
-| Review          | Runs | Last Run            | Status               |
-|-----------------|------|---------------------|----------------------|
-| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
-| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
-| Design Review   |  0   | —                   | NOT YET RUN          |
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  0   | —                   | —         | no       |
+| Design Review   |  0   | —                   | —         | no       |
 +--------------------------------------------------------------------+
-| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
+| VERDICT: CLEARED — Eng Review passed                                |
 +====================================================================+
 ```
 
+**Review tiers:**
+- **Eng Review (required by default):** The only review that gates shipping. Covers architecture, code quality, tests, performance. Can be disabled globally with \`gstack-config set skip_eng_review true\` (the "don't bother me" setting).
+- **CEO Review (optional):** Use your judgment. Recommend it for big product/business changes, new user-facing features, or scope decisions. Skip for bug fixes, refactors, infra, and cleanup.
+- **Design Review (optional):** Use your judgment. Recommend it for UI/UX changes. Skip for backend-only, infra, or prompt-only changes.
+
 **Verdict logic:**
-- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
-- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
-- Informational only — does NOT block.
+- **CLEARED**: Eng Review has >= 1 entry within 7 days with status "clean" (or \`skip_eng_review\` is \`true\`)
+- **NOT CLEARED**: Eng Review missing, stale (>7 days), or has open issues
+- CEO and Design reviews are shown for context but never block shipping
+- If \`skip_eng_review\` config is \`true\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index b5c0775b..05d29242 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -277,11 +277,13 @@ Substitute values from the Completion Summary:
 
 ## Review Readiness Dashboard
 
-After completing the review, read the review log to display the dashboard.
+After completing the review, read the review log and config to display the dashboard.
 
 ```bash
 eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+echo "---CONFIG---"
+~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
 Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
@@ -290,20 +292,26 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 +====================================================================+
 |                    REVIEW READINESS DASHBOARD                       |
 +====================================================================+
-| Review          | Runs | Last Run            | Status               |
-|-----------------|------|---------------------|----------------------|
-| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
-| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
-| Design Review   |  0   | —                   | NOT YET RUN          |
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  0   | —                   | —         | no       |
+| Design Review   |  0   | —                   | —         | no       |
 +--------------------------------------------------------------------+
-| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
+| VERDICT: CLEARED — Eng Review passed                                |
 +====================================================================+
 ```
 
+**Review tiers:**
+- **Eng Review (required by default):** The only review that gates shipping. Covers architecture, code quality, tests, performance. Can be disabled globally with \`gstack-config set skip_eng_review true\` (the "don't bother me" setting).
+- **CEO Review (optional):** Use your judgment. Recommend it for big product/business changes, new user-facing features, or scope decisions. Skip for bug fixes, refactors, infra, and cleanup.
+- **Design Review (optional):** Use your judgment. Recommend it for UI/UX changes. Skip for backend-only, infra, or prompt-only changes.
+
 **Verdict logic:**
-- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
-- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
-- Informational only — does NOT block.
+- **CLEARED**: Eng Review has >= 1 entry within 7 days with status "clean" (or \`skip_eng_review\` is \`true\`)
+- **NOT CLEARED**: Eng Review missing, stale (>7 days), or has open issues
+- CEO and Design reviews are shown for context but never block shipping
+- If \`skip_eng_review\` config is \`true\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED
 
 ## Unresolved decisions
 If the user does not respond to an AskUserQuestion or interrupts to move on, note which decisions were left unresolved. At the end of the review, list these as "Unresolved decisions that may bite you later" — never silently default to an option.
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index a9d3bce6..ee8a1c09 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -817,11 +817,13 @@ Tie everything to user goals and product objectives. Always suggest specific imp
 function generateReviewDashboard(): string {
   return `## Review Readiness Dashboard
 
-After completing the review, read the review log to display the dashboard.
+After completing the review, read the review log and config to display the dashboard.
 
 \`\`\`bash
 eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+echo "---CONFIG---"
+~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 \`\`\`
 
 Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
@@ -830,20 +832,26 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 +====================================================================+
 |                    REVIEW READINESS DASHBOARD                       |
 +====================================================================+
-| Review          | Runs | Last Run            | Status               |
-|-----------------|------|---------------------|----------------------|
-| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
-| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
-| Design Review   |  0   | —                   | NOT YET RUN          |
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  0   | —                   | —         | no       |
+| Design Review   |  0   | —                   | —         | no       |
 +--------------------------------------------------------------------+
-| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
+| VERDICT: CLEARED — Eng Review passed                                |
 +====================================================================+
 \`\`\`
 
+**Review tiers:**
+- **Eng Review (required by default):** The only review that gates shipping. Covers architecture, code quality, tests, performance. Can be disabled globally with \\\`gstack-config set skip_eng_review true\\\` (the "don't bother me" setting).
+- **CEO Review (optional):** Use your judgment. Recommend it for big product/business changes, new user-facing features, or scope decisions. Skip for bug fixes, refactors, infra, and cleanup.
+- **Design Review (optional):** Use your judgment. Recommend it for UI/UX changes. Skip for backend-only, infra, or prompt-only changes.
+
 **Verdict logic:**
-- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
-- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
-- Informational only — does NOT block.`;
+- **CLEARED**: Eng Review has >= 1 entry within 7 days with status "clean" (or \\\`skip_eng_review\\\` is \\\`true\\\`)
+- **NOT CLEARED**: Eng Review missing, stale (>7 days), or has open issues
+- CEO and Design reviews are shown for context but never block shipping
+- If \\\`skip_eng_review\\\` config is \\\`true\\\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED`;
 }
 
 const RESOLVERS: Record<string, () => string> = {
diff --git a/ship/SKILL.md b/ship/SKILL.md
index e7b8b753..b000f445 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -136,11 +136,13 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 ## Review Readiness Dashboard
 
-After completing the review, read the review log to display the dashboard.
+After completing the review, read the review log and config to display the dashboard.
 
 ```bash
 eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
 cat ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_REVIEWS"
+echo "---CONFIG---"
+~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
 Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
@@ -149,25 +151,32 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 +====================================================================+
 |                    REVIEW READINESS DASHBOARD                       |
 +====================================================================+
-| Review          | Runs | Last Run            | Status               |
-|-----------------|------|---------------------|----------------------|
-| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR                |
-| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR                |
-| Design Review   |  0   | —                   | NOT YET RUN          |
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  0   | —                   | —         | no       |
+| Design Review   |  0   | —                   | —         | no       |
 +--------------------------------------------------------------------+
-| VERDICT: 2/3 CLEAR — Design Review not yet run                      |
+| VERDICT: CLEARED — Eng Review passed                                |
 +====================================================================+
 ```
 
+**Review tiers:**
+- **Eng Review (required by default):** The only review that gates shipping. Covers architecture, code quality, tests, performance. Can be disabled globally with \`gstack-config set skip_eng_review true\` (the "don't bother me" setting).
+- **CEO Review (optional):** Use your judgment. Recommend it for big product/business changes, new user-facing features, or scope decisions. Skip for bug fixes, refactors, infra, and cleanup.
+- **Design Review (optional):** Use your judgment. Recommend it for UI/UX changes. Skip for backend-only, infra, or prompt-only changes.
+
 **Verdict logic:**
-- **CLEARED TO SHIP (3/3)**: All three have >= 1 entry within 7 days AND most recent status is "clean"
-- **N/3 CLEAR**: Show count and list which are missing, have open issues, or are stale (>7 days)
-- Informational only — does NOT block.
-
-If the verdict is NOT "CLEARED TO SHIP (3/3)", use AskUserQuestion:
-- Show which reviews are missing or have open issues
-- RECOMMENDATION: Choose B (run missing reviews first) unless the change is trivial
-- Options: A) Ship anyway  B) Abort — run missing review(s) first  C) Reviews not relevant for this change
+- **CLEARED**: Eng Review has >= 1 entry within 7 days with status "clean" (or \`skip_eng_review\` is \`true\`)
+- **NOT CLEARED**: Eng Review missing, stale (>7 days), or has open issues
+- CEO and Design reviews are shown for context but never block shipping
+- If \`skip_eng_review\` config is \`true\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED
+
+If the verdict is NOT "CLEARED", use AskUserQuestion:
+- Show that Eng Review is missing or has open issues
+- RECOMMENDATION: Choose B (run eng review first) unless the change is obviously trivial (<20 lines, typo fix, config-only)
+- Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
+- If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
 
 ---
 
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index 2a24bea3..d38bfab3 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -54,10 +54,11 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 {{REVIEW_DASHBOARD}}
 
-If the verdict is NOT "CLEARED TO SHIP (3/3)", use AskUserQuestion:
-- Show which reviews are missing or have open issues
-- RECOMMENDATION: Choose B (run missing reviews first) unless the change is trivial
-- Options: A) Ship anyway  B) Abort — run missing review(s) first  C) Reviews not relevant for this change
+If the verdict is NOT "CLEARED", use AskUserQuestion:
+- Show that Eng Review is missing or has open issues
+- RECOMMENDATION: Choose B (run eng review first) unless the change is obviously trivial (<20 lines, typo fix, config-only)
+- Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
+- If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
 
 ---
 
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index 26de63db..c3861e8d 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -343,9 +343,10 @@ describe('REVIEW_DASHBOARD resolver', () => {
   test('resolver output contains key dashboard elements', () => {
     const content = fs.readFileSync(path.join(ROOT, 'plan-ceo-review', 'SKILL.md'), 'utf-8');
     expect(content).toContain('VERDICT');
-    expect(content).toContain('CLEARED TO SHIP');
-    expect(content).toContain('NOT YET RUN');
+    expect(content).toContain('CLEARED');
+    expect(content).toContain('Eng Review');
     expect(content).toContain('7 days');
     expect(content).toContain('Design Review');
+    expect(content).toContain('skip_eng_review');
   });
 });
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 4378c322..ade94b39 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -852,6 +852,89 @@ Focus on reviewing the plan content: architecture, error handling, security, and
   }, 420_000);
 });
 
+// --- Plan CEO Review (SELECTIVE EXPANSION) E2E ---
+
+describeE2E('Plan CEO Review SELECTIVE EXPANSION E2E', () => {
+  let planDir: string;
+
+  beforeAll(() => {
+    planDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-plan-ceo-sel-'));
+    const { spawnSync } = require('child_process');
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: planDir, stdio: 'pipe', timeout: 5000 });
+
+    run('git', ['init']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+
+    fs.writeFileSync(path.join(planDir, 'plan.md'), `# Plan: Add User Dashboard
+
+## Context
+We're building a new user dashboard that shows recent activity, notifications, and quick actions.
+
+## Changes
+1. New React component \`UserDashboard\` in \`src/components/\`
+2. REST API endpoint \`GET /api/dashboard\` returning user stats
+3. PostgreSQL query for activity aggregation
+4. Redis cache layer for dashboard data (5min TTL)
+
+## Architecture
+- Frontend: React + TailwindCSS
+- Backend: Express.js REST API
+- Database: PostgreSQL with existing user/activity tables
+- Cache: Redis for dashboard aggregates
+
+## Open questions
+- Should we use WebSocket for real-time updates?
+- How do we handle users with 100k+ activity records?
+`);
+
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'add plan']);
+
+    fs.mkdirSync(path.join(planDir, 'plan-ceo-review'), { recursive: true });
+    fs.copyFileSync(
+      path.join(ROOT, 'plan-ceo-review', 'SKILL.md'),
+      path.join(planDir, 'plan-ceo-review', 'SKILL.md'),
+    );
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(planDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/plan-ceo-review SELECTIVE EXPANSION produces structured review output', async () => {
+    const result = await runSkillTest({
+      prompt: `Read plan-ceo-review/SKILL.md for the review workflow.
+
+Read plan.md — that's the plan to review. This is a standalone plan document, not a codebase — skip any codebase exploration or system audit steps.
+
+Choose SELECTIVE EXPANSION mode. Skip any AskUserQuestion calls — this is non-interactive.
+For the cherry-pick ceremony, accept all expansion proposals automatically.
+Write your complete review directly to ${planDir}/review-output-selective.md
+
+Focus on reviewing the plan content: architecture, error handling, security, and performance.`,
+      workingDirectory: planDir,
+      maxTurns: 15,
+      timeout: 360_000,
+      testName: 'plan-ceo-review-selective',
+      runId,
+    });
+
+    logCost('/plan-ceo-review (SELECTIVE)', result);
+    recordE2E('/plan-ceo-review-selective', 'Plan CEO Review SELECTIVE EXPANSION E2E', result, {
+      passed: ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+
+    const reviewPath = path.join(planDir, 'review-output-selective.md');
+    if (fs.existsSync(reviewPath)) {
+      const review = fs.readFileSync(reviewPath, 'utf-8');
+      expect(review.length).toBeGreaterThan(200);
+    }
+  }, 420_000);
+});
+
 // --- Plan Eng Review E2E ---
 
 describeE2E('Plan Eng Review E2E', () => {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 78a9bef7..4231a91d 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -666,6 +666,36 @@ describe('Planted-bug fixture validation', () => {
   });
 });
 
+// --- CEO review mode validation ---
+
+describe('CEO review mode validation', () => {
+  const content = fs.readFileSync(path.join(ROOT, 'plan-ceo-review', 'SKILL.md'), 'utf-8');
+
+  test('has all four CEO review modes defined', () => {
+    const modes = ['SCOPE EXPANSION', 'SELECTIVE EXPANSION', 'HOLD SCOPE', 'SCOPE REDUCTION'];
+    for (const mode of modes) {
+      expect(content).toContain(mode);
+    }
+  });
+
+  test('has CEO plan persistence step', () => {
+    expect(content).toContain('ceo-plans');
+    expect(content).toContain('status: ACTIVE');
+  });
+
+  test('has docs/designs promotion section', () => {
+    expect(content).toContain('docs/designs');
+    expect(content).toContain('PROMOTED');
+  });
+
+  test('mode quick reference has four columns', () => {
+    expect(content).toContain('EXPANSION');
+    expect(content).toContain('SELECTIVE');
+    expect(content).toContain('HOLD SCOPE');
+    expect(content).toContain('REDUCTION');
+  });
+});
+
 // --- gstack-slug helper ---
 
 describe('gstack-slug', () => {

From b65a464d37e564a0623e6358d2d7a3080b386647 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 12:41:44 -0500
Subject: [PATCH 14/22] feat: always-full eng review + ship review gate
 persistence (v0.5.4) (#135)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Remove SMALL/BIG CHANGE menu from /plan-eng-review — every plan gets the
full interactive review. Scope reduction is now proactive (only when
complexity check triggers) rather than a menu item.

Add review gate override persistence to /ship — when the user says "ship
anyway" or "not relevant", that decision is saved to the branch's
reviews.jsonl so subsequent /ship runs don't re-ask.

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                  | 11 +++++++++++
 VERSION                       |  2 +-
 plan-eng-review/SKILL.md      | 14 ++++++--------
 plan-eng-review/SKILL.md.tmpl | 14 ++++++--------
 ship/SKILL.md                 | 26 +++++++++++++++++++++-----
 ship/SKILL.md.tmpl            | 26 +++++++++++++++++++++-----
 test/skill-e2e.test.ts        |  4 ++--
 7 files changed, 68 insertions(+), 29 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index a61be2db..4a98b635 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,16 @@
 # Changelog
 
+## 0.5.4 — 2026-03-17
+
+- **Engineering review is always the full review now.** `/plan-eng-review` no longer asks you to choose between "big change" and "small change" modes. Every plan gets the full interactive walkthrough (architecture, code quality, tests, performance). Scope reduction is only suggested when the complexity check actually triggers — not as a standing menu option.
+- **Ship stops asking about reviews once you've answered.** When `/ship` asks about missing reviews and you say "ship anyway" or "not relevant," that decision is saved for the branch. No more getting re-asked every time you re-run `/ship` after a pre-landing fix.
+
+### For contributors
+
+- Removed SMALL_CHANGE / BIG_CHANGE / SCOPE_REDUCTION menu from `plan-eng-review/SKILL.md.tmpl`. Scope reduction is now proactive (triggered by complexity check) rather than a menu item.
+- Added review gate override persistence to `ship/SKILL.md.tmpl` — writes `ship-review-override` entries to `$BRANCH-reviews.jsonl` so subsequent `/ship` runs skip the gate.
+- Updated 2 E2E test prompts to match new flow.
+
 ## 0.5.3 — 2026-03-17
 
 - **You're always in control — even when dreaming big.** `/plan-ceo-review` now presents every scope expansion as an individual decision you opt into. EXPANSION mode recommends enthusiastically, but you say yes or no to each idea. No more "the agent went wild and added 5 features I didn't ask for."
diff --git a/VERSION b/VERSION
index be14282b..7d856835 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.3
+0.5.4
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index 05d29242..d4e9a83e 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -110,12 +110,11 @@ Before reviewing anything, answer these questions:
 3. **Complexity check:** If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
 4. **TODOS cross-reference:** Read `TODOS.md` if it exists. Are any deferred items blocking this plan? Can any deferred items be bundled into this PR without expanding scope? Does this plan create new work that should be captured as a TODO?
 
-Then ask if I want one of three options:
-1. **SCOPE REDUCTION:** The plan is overbuilt. Propose a minimal version that achieves the core goal, then review that.
-2. **BIG CHANGE:** Work through interactively, one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
-3. **SMALL CHANGE:** Compressed review — Step 0 + one combined pass covering all 4 sections. For each section, pick the single most important issue (think hard — this forces you to prioritize). Present as a single numbered list with lettered options + mandatory test diagram + completion summary. One AskUserQuestion round at the end. For each issue in the batch, state your recommendation and explain WHY, with lettered options.
+If the complexity check triggers (more than 8 files or more than 2 new classes/services), proactively recommend scope reduction via AskUserQuestion — explain what's overbuilt, propose a minimal version that achieves the core goal, and ask whether to reduce or proceed as-is. If the complexity check does not trigger, present your Step 0 findings and proceed directly to Section 1.
 
-**Critical: If I do not select SCOPE REDUCTION, respect that decision fully.** Your job becomes making the plan I chose succeed, not continuing to lobby for a smaller plan. Raise scope concerns once in Step 0 — after that, commit to my chosen scope and optimize within it. Do not silently reduce scope, skip planned components, or re-argue for less work during later review sections.
+Always work through the full interactive review: one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
+
+**Critical: Once the user accepts or rejects a scope reduction recommendation, commit fully.** Do not re-argue for smaller scope during later review sections. Do not silently reduce scope or skip planned components.
 
 ## Review Sections (after scope is agreed)
 
@@ -201,7 +200,6 @@ Follow the AskUserQuestion format from the Preamble above. Additional rules for
 * **Map the reasoning to my engineering preferences above.** One sentence connecting your recommendation to a specific preference (DRY, explicit > clever, minimal diff, etc.).
 * Label with issue NUMBER + option LETTER (e.g., "3A", "3B").
 * **Escape hatch:** If a section has no issues, say so and move on. If an issue has an obvious fix with no real alternatives, state what you'll do and move on — don't waste a question on it. Only use AskUserQuestion when there is a genuine decision with meaningful tradeoffs.
-* **Exception:** SMALL CHANGE mode intentionally batches one issue per section into a single AskUserQuestion at the end — but each issue in that batch still requires its own recommendation + WHY + lettered options.
 
 ## Required outputs
 
@@ -239,7 +237,7 @@ If any failure mode has no test AND no error handling AND would be silent, flag
 
 ### Completion summary
 At the end of the review, fill in and display this summary so the user can see all findings at a glance:
-- Step 0: Scope Challenge (user chose: ___)
+- Step 0: Scope Challenge — ___ (scope accepted as-is / scope reduced per recommendation)
 - Architecture Review: ___ issues found
 - Code Quality Review: ___ issues found
 - Test Review: diagram produced, ___ gaps identified
@@ -273,7 +271,7 @@ Substitute values from the Completion Summary:
 - **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
 - **unresolved**: number from "Unresolved decisions" count
 - **critical_gaps**: number from "Failure modes: ___ critical gaps flagged"
-- **MODE**: SCOPE_REDUCTION / BIG_CHANGE / SMALL_CHANGE
+- **MODE**: FULL_REVIEW / SCOPE_REDUCED
 
 ## Review Readiness Dashboard
 
diff --git a/plan-eng-review/SKILL.md.tmpl b/plan-eng-review/SKILL.md.tmpl
index 4905d8d3..3433cb75 100644
--- a/plan-eng-review/SKILL.md.tmpl
+++ b/plan-eng-review/SKILL.md.tmpl
@@ -45,12 +45,11 @@ Before reviewing anything, answer these questions:
 3. **Complexity check:** If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
 4. **TODOS cross-reference:** Read `TODOS.md` if it exists. Are any deferred items blocking this plan? Can any deferred items be bundled into this PR without expanding scope? Does this plan create new work that should be captured as a TODO?
 
-Then ask if I want one of three options:
-1. **SCOPE REDUCTION:** The plan is overbuilt. Propose a minimal version that achieves the core goal, then review that.
-2. **BIG CHANGE:** Work through interactively, one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
-3. **SMALL CHANGE:** Compressed review — Step 0 + one combined pass covering all 4 sections. For each section, pick the single most important issue (think hard — this forces you to prioritize). Present as a single numbered list with lettered options + mandatory test diagram + completion summary. One AskUserQuestion round at the end. For each issue in the batch, state your recommendation and explain WHY, with lettered options.
+If the complexity check triggers (more than 8 files or more than 2 new classes/services), proactively recommend scope reduction via AskUserQuestion — explain what's overbuilt, propose a minimal version that achieves the core goal, and ask whether to reduce or proceed as-is. If the complexity check does not trigger, present your Step 0 findings and proceed directly to Section 1.
 
-**Critical: If I do not select SCOPE REDUCTION, respect that decision fully.** Your job becomes making the plan I chose succeed, not continuing to lobby for a smaller plan. Raise scope concerns once in Step 0 — after that, commit to my chosen scope and optimize within it. Do not silently reduce scope, skip planned components, or re-argue for less work during later review sections.
+Always work through the full interactive review: one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
+
+**Critical: Once the user accepts or rejects a scope reduction recommendation, commit fully.** Do not re-argue for smaller scope during later review sections. Do not silently reduce scope or skip planned components.
 
 ## Review Sections (after scope is agreed)
 
@@ -136,7 +135,6 @@ Follow the AskUserQuestion format from the Preamble above. Additional rules for
 * **Map the reasoning to my engineering preferences above.** One sentence connecting your recommendation to a specific preference (DRY, explicit > clever, minimal diff, etc.).
 * Label with issue NUMBER + option LETTER (e.g., "3A", "3B").
 * **Escape hatch:** If a section has no issues, say so and move on. If an issue has an obvious fix with no real alternatives, state what you'll do and move on — don't waste a question on it. Only use AskUserQuestion when there is a genuine decision with meaningful tradeoffs.
-* **Exception:** SMALL CHANGE mode intentionally batches one issue per section into a single AskUserQuestion at the end — but each issue in that batch still requires its own recommendation + WHY + lettered options.
 
 ## Required outputs
 
@@ -174,7 +172,7 @@ If any failure mode has no test AND no error handling AND would be silent, flag
 
 ### Completion summary
 At the end of the review, fill in and display this summary so the user can see all findings at a glance:
-- Step 0: Scope Challenge (user chose: ___)
+- Step 0: Scope Challenge — ___ (scope accepted as-is / scope reduced per recommendation)
 - Architecture Review: ___ issues found
 - Code Quality Review: ___ issues found
 - Test Review: diagram produced, ___ gaps identified
@@ -208,7 +206,7 @@ Substitute values from the Completion Summary:
 - **STATUS**: "clean" if 0 unresolved decisions AND 0 critical gaps; otherwise "issues_open"
 - **unresolved**: number from "Unresolved decisions" count
 - **critical_gaps**: number from "Failure modes: ___ critical gaps flagged"
-- **MODE**: SCOPE_REDUCTION / BIG_CHANGE / SMALL_CHANGE
+- **MODE**: FULL_REVIEW / SCOPE_REDUCED
 
 {{REVIEW_DASHBOARD}}
 
diff --git a/ship/SKILL.md b/ship/SKILL.md
index b000f445..dc1a86a2 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -172,11 +172,27 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 - CEO and Design reviews are shown for context but never block shipping
 - If \`skip_eng_review\` config is \`true\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED
 
-If the verdict is NOT "CLEARED", use AskUserQuestion:
-- Show that Eng Review is missing or has open issues
-- RECOMMENDATION: Choose B (run eng review first) unless the change is obviously trivial (<20 lines, typo fix, config-only)
-- Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
-- If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+If the Eng Review is NOT "CLEAR":
+
+1. **Check for a prior override on this branch:**
+   ```bash
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+   grep '"skill":"ship-review-override"' ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_OVERRIDE"
+   ```
+   If an override exists, display the dashboard and note "Review gate previously accepted — continuing." Do NOT ask again.
+
+2. **If no override exists,** use AskUserQuestion:
+   - Show that Eng Review is missing or has open issues
+   - RECOMMENDATION: Choose C if the change is obviously trivial (< 20 lines, typo fix, config-only); Choose B for larger changes
+   - Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
+   - If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+
+3. **If the user chooses A or C,** persist the decision so future `/ship` runs on this branch skip the gate:
+   ```bash
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+   echo '{"skill":"ship-review-override","timestamp":"'"$(date -u +%Y-%m-%dT%H:%M:%SZ)"'","decision":"USER_CHOICE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+   ```
+   Substitute USER_CHOICE with "ship_anyway" or "not_relevant".
 
 ---
 
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index d38bfab3..bb6db158 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -54,11 +54,27 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 
 {{REVIEW_DASHBOARD}}
 
-If the verdict is NOT "CLEARED", use AskUserQuestion:
-- Show that Eng Review is missing or has open issues
-- RECOMMENDATION: Choose B (run eng review first) unless the change is obviously trivial (<20 lines, typo fix, config-only)
-- Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
-- If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+If the Eng Review is NOT "CLEAR":
+
+1. **Check for a prior override on this branch:**
+   ```bash
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+   grep '"skill":"ship-review-override"' ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl 2>/dev/null || echo "NO_OVERRIDE"
+   ```
+   If an override exists, display the dashboard and note "Review gate previously accepted — continuing." Do NOT ask again.
+
+2. **If no override exists,** use AskUserQuestion:
+   - Show that Eng Review is missing or has open issues
+   - RECOMMENDATION: Choose C if the change is obviously trivial (< 20 lines, typo fix, config-only); Choose B for larger changes
+   - Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
+   - If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+
+3. **If the user chooses A or C,** persist the decision so future `/ship` runs on this branch skip the gate:
+   ```bash
+   eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+   echo '{"skill":"ship-review-override","timestamp":"'"$(date -u +%Y-%m-%dT%H:%M:%SZ)"'","decision":"USER_CHOICE"}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+   ```
+   Substitute USER_CHOICE with "ship_anyway" or "not_relevant".
 
 ---
 
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index ade94b39..e50f688e 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1003,7 +1003,7 @@ Replace session-cookie auth with JWT tokens. Currently using express-session + R
 
 Read plan.md — that's the plan to review. This is a standalone plan document, not a codebase — skip any codebase exploration steps.
 
-Choose SMALL CHANGE mode. Skip any AskUserQuestion calls — this is non-interactive.
+Proceed directly to the full review. Skip any AskUserQuestion calls — this is non-interactive.
 Write your complete review directly to ${planDir}/review-output.md
 
 Focus on architecture, code quality, tests, and performance sections.`,
@@ -1404,7 +1404,7 @@ export function main() { return Dashboard(); }
 
 Read plan.md — that's the plan to review. This is a standalone plan with source code in app.ts and dashboard.ts.
 
-Choose SMALL CHANGE mode. Skip any AskUserQuestion calls — this is non-interactive.
+Proceed directly to the full review. Skip any AskUserQuestion calls — this is non-interactive.
 
 IMPORTANT: After your review, you MUST write the test-plan artifact as described in the "Test Plan Artifact" section of SKILL.md. The remote-slug shim is at ${planDir}/browse/bin/remote-slug.
 

From a2d756f945854a8ad8b61f8c84021f0f221d223c Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 13:05:18 -0500
Subject: [PATCH 15/22] feat: Test Bootstrap + Regression Tests + Coverage
 Audit (v0.6.0) (#136)

* feat: test bootstrap, regression tests, coverage audit, retro test health

- Add {{TEST_BOOTSTRAP}} resolver to gen-skill-docs.ts
- Add Phase 8e.5 regression test generation to /qa and /qa-design-review
- Add Step 3.4 test coverage audit with quality scoring to /ship
- Add test health tracking to /retro
- Add 2 E2E evals (bootstrap + coverage audit)
- Add 26 validation tests
- Update ARCHITECTURE.md placeholder table
- Add 2 P3 TODOs (CI/CD non-GitHub, auto-upgrade weak tests)

* chore: bump version and changelog (v0.6.0)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* feat: make coverage audit trace actual codepaths, not just syntax patterns

Step 3.4 now instructs Claude to read full files, trace data flow through
every branch, diagram the execution, and check each branch against tests.
Phase 8e.5 regression tests now trace the bug's codepath before writing
the test, catching adjacent edge cases.

* feat: coverage audit now maps user flows, interactions, and error states

Step 3.4 now covers the full picture: code branches AND user-facing behavior.
Maps user flows (complete journey through the feature), interaction edge cases
(double-click, back button, stale state, slow connection), error states
(what does the user actually see?), and boundary states (zero results,
10k results, max-length input). Coverage diagram splits into Code Path
Coverage and User Flow Coverage sections with separate percentages.

* fix: raise test gen cap to 20, add validation tests for user flow coverage

- Raise Step 3.4 test generation cap from 10 to 20 (code + user flow combined)
- Add 3 validation tests: codepath tracing, user flow mapping, diagram sections

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 ARCHITECTURE.md                    |   2 +
 CHANGELOG.md                       |  21 ++
 TODOS.md                           |  24 +++
 VERSION                            |   2 +-
 qa-design-review/SKILL.md          | 170 +++++++++++++++-
 qa-design-review/SKILL.md.tmpl     |  19 +-
 qa-only/SKILL.md                   |   1 +
 qa-only/SKILL.md.tmpl              |   1 +
 qa/SKILL.md                        | 211 +++++++++++++++++++-
 qa/SKILL.md.tmpl                   |  60 +++++-
 qa/templates/qa-report-template.md |  16 ++
 retro/SKILL.md                     |  29 ++-
 retro/SKILL.md.tmpl                |  29 ++-
 scripts/gen-skill-docs.ts          | 156 +++++++++++++++
 ship/SKILL.md                      | 302 +++++++++++++++++++++++++++++
 ship/SKILL.md.tmpl                 | 151 +++++++++++++++
 test/skill-e2e.test.ts             | 263 +++++++++++++++++++++++++
 test/skill-validation.test.ts      | 222 +++++++++++++++++++++
 18 files changed, 1672 insertions(+), 7 deletions(-)

diff --git a/ARCHITECTURE.md b/ARCHITECTURE.md
index bccb13ff..79bfda75 100644
--- a/ARCHITECTURE.md
+++ b/ARCHITECTURE.md
@@ -203,6 +203,8 @@ Templates contain the workflows, tips, and examples that require human judgment.
 | `{{BASE_BRANCH_DETECT}}` | `gen-skill-docs.ts` | Dynamic base branch detection for PR-targeting skills (ship, review, qa, plan-ceo-review) |
 | `{{QA_METHODOLOGY}}` | `gen-skill-docs.ts` | Shared QA methodology block for /qa and /qa-only |
 | `{{DESIGN_METHODOLOGY}}` | `gen-skill-docs.ts` | Shared design audit methodology for /plan-design-review and /qa-design-review |
+| `{{REVIEW_DASHBOARD}}` | `gen-skill-docs.ts` | Review Readiness Dashboard for /ship pre-flight (also embedded in /plan-eng-review) |
+| `{{TEST_BOOTSTRAP}}` | `gen-skill-docs.ts` | Test framework detection, bootstrap, CI/CD setup for /qa, /ship, /qa-design-review |
 
 This is structurally sound — if a command exists in code, it appears in docs. If it doesn't exist, it can't appear.
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 4a98b635..12fa243b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,26 @@
 # Changelog
 
+## 0.6.0 — 2026-03-17
+
+- **100% test coverage is the key to great vibe coding.** gstack now bootstraps test frameworks from scratch when your project doesn't have one. It detects your runtime, researches the best framework, asks you to pick, installs it, writes 3-5 real tests for your actual code, sets up CI/CD (GitHub Actions), creates TESTING.md, and adds test culture instructions to CLAUDE.md. Every Claude Code session after that writes tests naturally.
+- **Every bug fix now gets a regression test.** When `/qa` fixes a bug and verifies it, Phase 8e.5 automatically generates a regression test that catches the exact scenario that broke. Tests include full attribution tracing back to the QA report. Auto-incrementing filenames prevent collisions across sessions.
+- **Ship with confidence — coverage audit shows what's tested and what's not.** `/ship` Step 3.4 builds a code path map from your diff, searches for corresponding tests, and produces an ASCII coverage diagram with quality stars (★★★ = edge cases + errors, ★★ = happy path, ★ = smoke test). Gaps get tests auto-generated. PR body shows "Tests: 42 → 47 (+5 new)".
+- **Your retro tracks test health.** `/retro` now shows total test files, tests added this period, regression test commits, and trend deltas. If the test ratio drops below 20%, the retro flags testing as a growth area.
+- **Design reviews generate regression tests too.** `/qa-design-review` Phase 8e.5 skips CSS-only fixes (those are caught by re-running the design audit) but writes tests for JavaScript behavior changes like broken dropdowns or animation failures.
+
+### For contributors
+
+- Added `generateTestBootstrap()` resolver to `gen-skill-docs.ts` (~155 lines). Registered as `{{TEST_BOOTSTRAP}}` in the RESOLVERS map. Inserted into qa, ship (Step 2.5), and qa-design-review templates.
+- Phase 8e.5 regression test generation added to `qa/SKILL.md.tmpl` (46 lines) and CSS-aware variant to `qa-design-review/SKILL.md.tmpl` (12 lines). Rule 13 amended to allow creating new test files.
+- Step 3.4 test coverage audit added to `ship/SKILL.md.tmpl` (88 lines) with quality scoring rubric and ASCII diagram format.
+- Test health tracking added to `retro/SKILL.md.tmpl`: 3 new data gathering commands, metrics row, narrative section, JSON schema field.
+- `qa-only/SKILL.md.tmpl` gets a recommendation note when no test framework is detected.
+- `qa-report-template.md` gains a Regression Tests section with deferred test specs.
+- ARCHITECTURE.md placeholder table updated with `{{TEST_BOOTSTRAP}}` and `{{REVIEW_DASHBOARD}}`.
+- WebSearch added to allowed-tools for qa, ship, qa-design-review.
+- 26 new validation tests, 2 new E2E evals (bootstrap + coverage audit).
+- 2 new P3 TODOs: CI/CD for non-GitHub providers, auto-upgrade weak tests.
+
 ## 0.5.4 — 2026-03-17
 
 - **Engineering review is always the full review now.** `/plan-eng-review` no longer asks you to choose between "big change" and "small change" modes. Every plan gets the full interactive walkthrough (architecture, code quality, tests, performance). Scope reduction is only suggested when the complexity check actually triggers — not as a standing menu option.
diff --git a/TODOS.md b/TODOS.md
index f52bb693..a0801d85 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -263,6 +263,30 @@
 **Effort:** S
 **Priority:** P3
 
+### CI/CD generation for non-GitHub providers
+
+**What:** Extend CI/CD bootstrap to generate GitLab CI (`.gitlab-ci.yml`), CircleCI (`.circleci/config.yml`), and Bitrise pipelines.
+
+**Why:** Not all projects use GitHub Actions. Universal CI/CD bootstrap would make test bootstrap work for everyone.
+
+**Context:** v1 ships with GitHub Actions only. Detection logic already checks for `.gitlab-ci.yml`, `.circleci/`, `bitrise.yml` and skips with an informational note. Each provider needs ~20 lines of template text in `generateTestBootstrap()`.
+
+**Effort:** M
+**Priority:** P3
+**Depends on:** Test bootstrap (shipped)
+
+### Auto-upgrade weak tests (★) to strong tests (★★★)
+
+**What:** When Step 3.4 coverage audit identifies existing ★-rated tests (smoke/trivial assertions), generate improved versions testing edge cases and error paths.
+
+**Why:** Many codebases have tests that technically exist but don't catch real bugs — `expect(component).toBeDefined()` isn't testing behavior. Upgrading these closes the gap between "has tests" and "has good tests."
+
+**Context:** Requires the quality scoring rubric from the test coverage audit. Modifying existing test files is riskier than creating new ones — needs careful diffing to ensure the upgraded test still passes. Consider creating a companion test file rather than modifying the original.
+
+**Effort:** M
+**Priority:** P3
+**Depends on:** Test quality scoring (shipped)
+
 ## Retro
 
 ### Deployment health tracking (retro + browse)
diff --git a/VERSION b/VERSION
index 7d856835..a918a2aa 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.5.4
+0.6.0
diff --git a/qa-design-review/SKILL.md b/qa-design-review/SKILL.md
index 0d8d0771..7044c560 100644
--- a/qa-design-review/SKILL.md
+++ b/qa-design-review/SKILL.md
@@ -14,6 +14,7 @@ allowed-tools:
   - Glob
   - Grep
   - AskUserQuestion
+  - WebSearch
 ---
 <!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
 <!-- Regenerate: bun run gen:skill-docs -->
@@ -136,6 +137,161 @@ If `NEEDS_SETUP`:
 2. Run: `cd <SKILL_DIR> && ./setup`
 3. If `bun` is not installed: `curl -fsSL https://bun.sh/install | bash`
 
+**Check test framework (bootstrap if needed):**
+
+## Test Framework Bootstrap
+
+**Detect existing test framework and project runtime:**
+
+```bash
+# Detect project runtime
+[ -f Gemfile ] && echo "RUNTIME:ruby"
+[ -f package.json ] && echo "RUNTIME:node"
+[ -f requirements.txt ] || [ -f pyproject.toml ] && echo "RUNTIME:python"
+[ -f go.mod ] && echo "RUNTIME:go"
+[ -f Cargo.toml ] && echo "RUNTIME:rust"
+[ -f composer.json ] && echo "RUNTIME:php"
+[ -f mix.exs ] && echo "RUNTIME:elixir"
+# Detect sub-frameworks
+[ -f Gemfile ] && grep -q "rails" Gemfile 2>/dev/null && echo "FRAMEWORK:rails"
+[ -f package.json ] && grep -q '"next"' package.json 2>/dev/null && echo "FRAMEWORK:nextjs"
+# Check for existing test infrastructure
+ls jest.config.* vitest.config.* playwright.config.* .rspec pytest.ini pyproject.toml phpunit.xml 2>/dev/null
+ls -d test/ tests/ spec/ __tests__/ cypress/ e2e/ 2>/dev/null
+# Check opt-out marker
+[ -f .gstack/no-test-bootstrap ] && echo "BOOTSTRAP_DECLINED"
+```
+
+**If test framework detected** (config files or test directories found):
+Print "Test framework detected: {name} ({N} existing tests). Skipping bootstrap."
+Read 2-3 existing test files to learn conventions (naming, imports, assertion style, setup patterns).
+Store conventions as prose context for use in Phase 8e.5 or Step 3.4. **Skip the rest of bootstrap.**
+
+**If BOOTSTRAP_DECLINED** appears: Print "Test bootstrap previously declined — skipping." **Skip the rest of bootstrap.**
+
+**If NO runtime detected** (no config files found): Use AskUserQuestion:
+"I couldn't detect your project's language. What runtime are you using?"
+Options: A) Node.js/TypeScript B) Ruby/Rails C) Python D) Go E) Rust F) PHP G) Elixir H) This project doesn't need tests.
+If user picks H → write `.gstack/no-test-bootstrap` and continue without tests.
+
+**If runtime detected but no test framework — bootstrap:**
+
+### B2. Research best practices
+
+Use WebSearch to find current best practices for the detected runtime:
+- `"[runtime] best test framework 2025 2026"`
+- `"[framework A] vs [framework B] comparison"`
+
+If WebSearch is unavailable, use this built-in knowledge table:
+
+| Runtime | Primary recommendation | Alternative |
+|---------|----------------------|-------------|
+| Ruby/Rails | minitest + fixtures + capybara | rspec + factory_bot + shoulda-matchers |
+| Node.js | vitest + @testing-library | jest + @testing-library |
+| Next.js | vitest + @testing-library/react + playwright | jest + cypress |
+| Python | pytest + pytest-cov | unittest |
+| Go | stdlib testing + testify | stdlib only |
+| Rust | cargo test (built-in) + mockall | — |
+| PHP | phpunit + mockery | pest |
+| Elixir | ExUnit (built-in) + ex_machina | — |
+
+### B3. Framework selection
+
+Use AskUserQuestion:
+"I detected this is a [Runtime/Framework] project with no test framework. I researched current best practices. Here are the options:
+A) [Primary] — [rationale]. Includes: [packages]. Supports: unit, integration, smoke, e2e
+B) [Alternative] — [rationale]. Includes: [packages]
+C) Skip — don't set up testing right now
+RECOMMENDATION: Choose A because [reason based on project context]"
+
+If user picks C → write `.gstack/no-test-bootstrap`. Tell user: "If you change your mind later, delete `.gstack/no-test-bootstrap` and re-run." Continue without tests.
+
+If multiple runtimes detected (monorepo) → ask which runtime to set up first, with option to do both sequentially.
+
+### B4. Install and configure
+
+1. Install the chosen packages (npm/bun/gem/pip/etc.)
+2. Create minimal config file
+3. Create directory structure (test/, spec/, etc.)
+4. Create one example test matching the project's code to verify setup works
+
+If package installation fails → debug once. If still failing → revert with `git checkout -- package.json package-lock.json` (or equivalent for the runtime). Warn user and continue without tests.
+
+### B4.5. First real tests
+
+Generate 3-5 real tests for existing code:
+
+1. **Find recently changed files:** `git log --since=30.days --name-only --format="" | sort | uniq -c | sort -rn | head -10`
+2. **Prioritize by risk:** Error handlers > business logic with conditionals > API endpoints > pure functions
+3. **For each file:** Write one test that tests real behavior with meaningful assertions. Never `expect(x).toBeDefined()` — test what the code DOES.
+4. Run each test. Passes → keep. Fails → fix once. Still fails → delete silently.
+5. Generate at least 1 test, cap at 5.
+
+Never import secrets, API keys, or credentials in test files. Use environment variables or test fixtures.
+
+### B5. Verify
+
+```bash
+# Run the full test suite to confirm everything works
+{detected test command}
+```
+
+If tests fail → debug once. If still failing → revert all bootstrap changes and warn user.
+
+### B5.5. CI/CD pipeline
+
+```bash
+# Check CI provider
+ls -d .github/ 2>/dev/null && echo "CI:github"
+ls .gitlab-ci.yml .circleci/ bitrise.yml 2>/dev/null
+```
+
+If `.github/` exists (or no CI detected — default to GitHub Actions):
+Create `.github/workflows/test.yml` with:
+- `runs-on: ubuntu-latest`
+- Appropriate setup action for the runtime (setup-node, setup-ruby, setup-python, etc.)
+- The same test command verified in B5
+- Trigger: push + pull_request
+
+If non-GitHub CI detected → skip CI generation with note: "Detected {provider} — CI pipeline generation supports GitHub Actions only. Add test step to your existing pipeline manually."
+
+### B6. Create TESTING.md
+
+First check: If TESTING.md already exists → read it and update/append rather than overwriting. Never destroy existing content.
+
+Write TESTING.md with:
+- Philosophy: "100% test coverage is the key to great vibe coding. Tests let you move fast, trust your instincts, and ship with confidence — without them, vibe coding is just yolo coding. With tests, it's a superpower."
+- Framework name and version
+- How to run tests (the verified command from B5)
+- Test layers: Unit tests (what, where, when), Integration tests, Smoke tests, E2E tests
+- Conventions: file naming, assertion style, setup/teardown patterns
+
+### B7. Update CLAUDE.md
+
+First check: If CLAUDE.md already has a `## Testing` section → skip. Don't duplicate.
+
+Append a `## Testing` section:
+- Run command and test directory
+- Reference to TESTING.md
+- Test expectations:
+  - 100% test coverage is the goal — tests make vibe coding safe
+  - When writing new functions, write a corresponding test
+  - When fixing a bug, write a regression test
+  - When adding error handling, write a test that triggers the error
+  - When adding a conditional (if/else, switch), write tests for BOTH paths
+  - Never commit code that makes existing tests fail
+
+### B8. Commit
+
+```bash
+git status --porcelain
+```
+
+Only commit if there are changes. Stage all bootstrap files (config, test directory, TESTING.md, CLAUDE.md, .github/workflows/test.yml if created):
+`git commit -m "chore: bootstrap test framework ({framework name})"`
+
+---
+
 **Create output directories:**
 
 ```bash
@@ -565,6 +721,18 @@ Take **before/after screenshot pair** for every fix.
 - **best-effort**: fix applied but couldn't fully verify (e.g., needs specific browser state)
 - **reverted**: regression detected → `git revert HEAD` → mark finding as "deferred"
 
+### 8e.5. Regression Test (design-review variant)
+
+Design fixes are typically CSS-only. Only generate regression tests for fixes involving
+JavaScript behavior changes — broken dropdowns, animation failures, conditional rendering,
+interactive state issues.
+
+For CSS-only fixes: skip entirely. CSS regressions are caught by re-running /qa-design-review.
+
+If the fix involved JS behavior: follow the same procedure as /qa Phase 8e.5 (study existing
+test patterns, write a regression test encoding the exact bug condition, run it, commit if
+passes or defer if fails). Commit format: `test(design): regression test for FINDING-NNN`.
+
 ### 8f. Self-Regulation (STOP AND EVALUATE)
 
 Every 5 fixes (or after any revert), compute the design-fix risk level:
@@ -639,7 +807,7 @@ If the repo has a `TODOS.md`:
 
 11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
 12. **One commit per fix.** Never bundle multiple design fixes into one commit.
-13. **Never modify tests or CI configuration.** Only fix application source code and styles.
+13. **Only modify tests when generating regression tests in Phase 8e.5.** Never modify CI configuration. Never modify existing tests — only create new test files.
 14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
 15. **Self-regulate.** Follow the design-fix risk heuristic. When in doubt, stop and ask.
 16. **CSS-first.** Prefer CSS/styling changes over structural component changes. CSS-only changes are safer and more reversible.
diff --git a/qa-design-review/SKILL.md.tmpl b/qa-design-review/SKILL.md.tmpl
index 0053a494..5969fb52 100644
--- a/qa-design-review/SKILL.md.tmpl
+++ b/qa-design-review/SKILL.md.tmpl
@@ -14,6 +14,7 @@ allowed-tools:
   - Glob
   - Grep
   - AskUserQuestion
+  - WebSearch
 ---
 
 {{PREAMBLE}}
@@ -54,6 +55,10 @@ fi
 
 {{BROWSE_SETUP}}
 
+**Check test framework (bootstrap if needed):**
+
+{{TEST_BOOTSTRAP}}
+
 **Create output directories:**
 
 ```bash
@@ -153,6 +158,18 @@ Take **before/after screenshot pair** for every fix.
 - **best-effort**: fix applied but couldn't fully verify (e.g., needs specific browser state)
 - **reverted**: regression detected → `git revert HEAD` → mark finding as "deferred"
 
+### 8e.5. Regression Test (design-review variant)
+
+Design fixes are typically CSS-only. Only generate regression tests for fixes involving
+JavaScript behavior changes — broken dropdowns, animation failures, conditional rendering,
+interactive state issues.
+
+For CSS-only fixes: skip entirely. CSS regressions are caught by re-running /qa-design-review.
+
+If the fix involved JS behavior: follow the same procedure as /qa Phase 8e.5 (study existing
+test patterns, write a regression test encoding the exact bug condition, run it, commit if
+passes or defer if fails). Commit format: `test(design): regression test for FINDING-NNN`.
+
 ### 8f. Self-Regulation (STOP AND EVALUATE)
 
 Every 5 fixes (or after any revert), compute the design-fix risk level:
@@ -227,7 +244,7 @@ If the repo has a `TODOS.md`:
 
 11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
 12. **One commit per fix.** Never bundle multiple design fixes into one commit.
-13. **Never modify tests or CI configuration.** Only fix application source code and styles.
+13. **Only modify tests when generating regression tests in Phase 8e.5.** Never modify CI configuration. Never modify existing tests — only create new test files.
 14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
 15. **Self-regulate.** Follow the design-fix risk heuristic. When in doubt, stop and ask.
 16. **CSS-first.** Prefer CSS/styling changes over structural component changes. CSS-only changes are safer and more reversible.
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index 36f5fead..4fa0cf04 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -452,3 +452,4 @@ Report filenames use the domain and date: `qa-report-myapp-com-2026-03-12.md`
 ## Additional Rules (qa-only specific)
 
 11. **Never fix bugs.** Find and document only. Do not read source code, edit files, or suggest fixes in the report. Your job is to report what's broken, not to fix it. Use `/qa` for the test-fix-verify loop.
+12. **No test framework detected?** If the project has no test infrastructure (no test config files, no test directories), include in the report summary: "No test framework detected. Run `/qa` to bootstrap one and enable regression test generation."
diff --git a/qa-only/SKILL.md.tmpl b/qa-only/SKILL.md.tmpl
index 101cd71c..831e71ed 100644
--- a/qa-only/SKILL.md.tmpl
+++ b/qa-only/SKILL.md.tmpl
@@ -97,3 +97,4 @@ Report filenames use the domain and date: `qa-report-myapp-com-2026-03-12.md`
 ## Additional Rules (qa-only specific)
 
 11. **Never fix bugs.** Find and document only. Do not read source code, edit files, or suggest fixes in the report. Your job is to report what's broken, not to fix it. Use `/qa` for the test-fix-verify loop.
+12. **No test framework detected?** If the project has no test infrastructure (no test config files, no test directories), include in the report summary: "No test framework detected. Run `/qa` to bootstrap one and enable regression test generation."
diff --git a/qa/SKILL.md b/qa/SKILL.md
index 9bd8fc9b..c01514cf 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -16,6 +16,7 @@ allowed-tools:
   - Glob
   - Grep
   - AskUserQuestion
+  - WebSearch
 ---
 <!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
 <!-- Regenerate: bun run gen:skill-docs -->
@@ -157,6 +158,161 @@ If `NEEDS_SETUP`:
 2. Run: `cd <SKILL_DIR> && ./setup`
 3. If `bun` is not installed: `curl -fsSL https://bun.sh/install | bash`
 
+**Check test framework (bootstrap if needed):**
+
+## Test Framework Bootstrap
+
+**Detect existing test framework and project runtime:**
+
+```bash
+# Detect project runtime
+[ -f Gemfile ] && echo "RUNTIME:ruby"
+[ -f package.json ] && echo "RUNTIME:node"
+[ -f requirements.txt ] || [ -f pyproject.toml ] && echo "RUNTIME:python"
+[ -f go.mod ] && echo "RUNTIME:go"
+[ -f Cargo.toml ] && echo "RUNTIME:rust"
+[ -f composer.json ] && echo "RUNTIME:php"
+[ -f mix.exs ] && echo "RUNTIME:elixir"
+# Detect sub-frameworks
+[ -f Gemfile ] && grep -q "rails" Gemfile 2>/dev/null && echo "FRAMEWORK:rails"
+[ -f package.json ] && grep -q '"next"' package.json 2>/dev/null && echo "FRAMEWORK:nextjs"
+# Check for existing test infrastructure
+ls jest.config.* vitest.config.* playwright.config.* .rspec pytest.ini pyproject.toml phpunit.xml 2>/dev/null
+ls -d test/ tests/ spec/ __tests__/ cypress/ e2e/ 2>/dev/null
+# Check opt-out marker
+[ -f .gstack/no-test-bootstrap ] && echo "BOOTSTRAP_DECLINED"
+```
+
+**If test framework detected** (config files or test directories found):
+Print "Test framework detected: {name} ({N} existing tests). Skipping bootstrap."
+Read 2-3 existing test files to learn conventions (naming, imports, assertion style, setup patterns).
+Store conventions as prose context for use in Phase 8e.5 or Step 3.4. **Skip the rest of bootstrap.**
+
+**If BOOTSTRAP_DECLINED** appears: Print "Test bootstrap previously declined — skipping." **Skip the rest of bootstrap.**
+
+**If NO runtime detected** (no config files found): Use AskUserQuestion:
+"I couldn't detect your project's language. What runtime are you using?"
+Options: A) Node.js/TypeScript B) Ruby/Rails C) Python D) Go E) Rust F) PHP G) Elixir H) This project doesn't need tests.
+If user picks H → write `.gstack/no-test-bootstrap` and continue without tests.
+
+**If runtime detected but no test framework — bootstrap:**
+
+### B2. Research best practices
+
+Use WebSearch to find current best practices for the detected runtime:
+- `"[runtime] best test framework 2025 2026"`
+- `"[framework A] vs [framework B] comparison"`
+
+If WebSearch is unavailable, use this built-in knowledge table:
+
+| Runtime | Primary recommendation | Alternative |
+|---------|----------------------|-------------|
+| Ruby/Rails | minitest + fixtures + capybara | rspec + factory_bot + shoulda-matchers |
+| Node.js | vitest + @testing-library | jest + @testing-library |
+| Next.js | vitest + @testing-library/react + playwright | jest + cypress |
+| Python | pytest + pytest-cov | unittest |
+| Go | stdlib testing + testify | stdlib only |
+| Rust | cargo test (built-in) + mockall | — |
+| PHP | phpunit + mockery | pest |
+| Elixir | ExUnit (built-in) + ex_machina | — |
+
+### B3. Framework selection
+
+Use AskUserQuestion:
+"I detected this is a [Runtime/Framework] project with no test framework. I researched current best practices. Here are the options:
+A) [Primary] — [rationale]. Includes: [packages]. Supports: unit, integration, smoke, e2e
+B) [Alternative] — [rationale]. Includes: [packages]
+C) Skip — don't set up testing right now
+RECOMMENDATION: Choose A because [reason based on project context]"
+
+If user picks C → write `.gstack/no-test-bootstrap`. Tell user: "If you change your mind later, delete `.gstack/no-test-bootstrap` and re-run." Continue without tests.
+
+If multiple runtimes detected (monorepo) → ask which runtime to set up first, with option to do both sequentially.
+
+### B4. Install and configure
+
+1. Install the chosen packages (npm/bun/gem/pip/etc.)
+2. Create minimal config file
+3. Create directory structure (test/, spec/, etc.)
+4. Create one example test matching the project's code to verify setup works
+
+If package installation fails → debug once. If still failing → revert with `git checkout -- package.json package-lock.json` (or equivalent for the runtime). Warn user and continue without tests.
+
+### B4.5. First real tests
+
+Generate 3-5 real tests for existing code:
+
+1. **Find recently changed files:** `git log --since=30.days --name-only --format="" | sort | uniq -c | sort -rn | head -10`
+2. **Prioritize by risk:** Error handlers > business logic with conditionals > API endpoints > pure functions
+3. **For each file:** Write one test that tests real behavior with meaningful assertions. Never `expect(x).toBeDefined()` — test what the code DOES.
+4. Run each test. Passes → keep. Fails → fix once. Still fails → delete silently.
+5. Generate at least 1 test, cap at 5.
+
+Never import secrets, API keys, or credentials in test files. Use environment variables or test fixtures.
+
+### B5. Verify
+
+```bash
+# Run the full test suite to confirm everything works
+{detected test command}
+```
+
+If tests fail → debug once. If still failing → revert all bootstrap changes and warn user.
+
+### B5.5. CI/CD pipeline
+
+```bash
+# Check CI provider
+ls -d .github/ 2>/dev/null && echo "CI:github"
+ls .gitlab-ci.yml .circleci/ bitrise.yml 2>/dev/null
+```
+
+If `.github/` exists (or no CI detected — default to GitHub Actions):
+Create `.github/workflows/test.yml` with:
+- `runs-on: ubuntu-latest`
+- Appropriate setup action for the runtime (setup-node, setup-ruby, setup-python, etc.)
+- The same test command verified in B5
+- Trigger: push + pull_request
+
+If non-GitHub CI detected → skip CI generation with note: "Detected {provider} — CI pipeline generation supports GitHub Actions only. Add test step to your existing pipeline manually."
+
+### B6. Create TESTING.md
+
+First check: If TESTING.md already exists → read it and update/append rather than overwriting. Never destroy existing content.
+
+Write TESTING.md with:
+- Philosophy: "100% test coverage is the key to great vibe coding. Tests let you move fast, trust your instincts, and ship with confidence — without them, vibe coding is just yolo coding. With tests, it's a superpower."
+- Framework name and version
+- How to run tests (the verified command from B5)
+- Test layers: Unit tests (what, where, when), Integration tests, Smoke tests, E2E tests
+- Conventions: file naming, assertion style, setup/teardown patterns
+
+### B7. Update CLAUDE.md
+
+First check: If CLAUDE.md already has a `## Testing` section → skip. Don't duplicate.
+
+Append a `## Testing` section:
+- Run command and test directory
+- Reference to TESTING.md
+- Test expectations:
+  - 100% test coverage is the goal — tests make vibe coding safe
+  - When writing new functions, write a corresponding test
+  - When fixing a bug, write a regression test
+  - When adding error handling, write a test that triggers the error
+  - When adding a conditional (if/else, switch), write tests for BOTH paths
+  - Never commit code that makes existing tests fail
+
+### B8. Commit
+
+```bash
+git status --porcelain
+```
+
+Only commit if there are changes. Stage all bootstrap files (config, test directory, TESTING.md, CLAUDE.md, .github/workflows/test.yml if created):
+`git commit -m "chore: bootstrap test framework ({framework name})"`
+
+---
+
 **Create output directories:**
 
 ```bash
@@ -541,6 +697,59 @@ $B snapshot -D
 - **best-effort**: fix applied but couldn't fully verify (e.g., needs auth state, external service)
 - **reverted**: regression detected → `git revert HEAD` → mark issue as "deferred"
 
+### 8e.5. Regression Test
+
+Skip if: classification is not "verified", OR the fix is purely visual/CSS with no JS behavior, OR no test framework was detected AND user declined bootstrap.
+
+**1. Study the project's existing test patterns:**
+
+Read 2-3 test files closest to the fix (same directory, same code type). Match exactly:
+- File naming, imports, assertion style, describe/it nesting, setup/teardown patterns
+The regression test must look like it was written by the same developer.
+
+**2. Trace the bug's codepath, then write a regression test:**
+
+Before writing the test, trace the data flow through the code you just fixed:
+- What input/state triggered the bug? (the exact precondition)
+- What codepath did it follow? (which branches, which function calls)
+- Where did it break? (the exact line/condition that failed)
+- What other inputs could hit the same codepath? (edge cases around the fix)
+
+The test MUST:
+- Set up the precondition that triggered the bug (the exact state that made it break)
+- Perform the action that exposed the bug
+- Assert the correct behavior (NOT "it renders" or "it doesn't throw")
+- If you found adjacent edge cases while tracing, test those too (e.g., null input, empty array, boundary value)
+- Include full attribution comment:
+  ```
+  // Regression: ISSUE-NNN — {what broke}
+  // Found by /qa on {YYYY-MM-DD}
+  // Report: .gstack/qa-reports/qa-report-{domain}-{date}.md
+  ```
+
+Test type decision:
+- Console error / JS exception / logic bug → unit or integration test
+- Broken form / API failure / data flow bug → integration test with request/response
+- Visual bug with JS behavior (broken dropdown, animation) → component test
+- Pure CSS → skip (caught by QA reruns)
+
+Default to unit tests unless the test type decision above calls for an integration or component test. Mock all external dependencies (DB, API, Redis, file system).
+
+Use auto-incrementing names to avoid collisions: check existing `{name}.regression-*.test.{ext}` files, take max number + 1.
+
+**3. Run only the new test file:**
+
+```bash
+{detected test command} {new-test-file}
+```
+
+**4. Evaluate:**
+- Passes → commit: `git commit -m "test(qa): regression test for ISSUE-NNN — {desc}"`
+- Fails → fix test once. Still failing → delete test, defer.
+- Taking >2 min exploration → skip and defer.
+
+**5. WTF-likelihood exclusion:** Regression test commits don't count as fixes when computing the WTF-likelihood heuristic in 8f.
+
 ### 8f. Self-Regulation (STOP AND EVALUATE)
 
 Every 5 fixes (or after any revert), compute the WTF-likelihood:
@@ -614,6 +823,6 @@ If the repo has a `TODOS.md`:
 
 11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
 12. **One commit per fix.** Never bundle multiple fixes into one commit.
-13. **Never modify tests or CI configuration.** Only fix application source code.
+13. **Never modify existing tests or existing CI configuration.** Only create new test files, and only during Test Framework Bootstrap or when generating regression tests in Phase 8e.5. The only CI file you may create is the workflow from bootstrap step B5.5.
 14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
 15. **Self-regulate.** Follow the WTF-likelihood heuristic. When in doubt, stop and ask.
diff --git a/qa/SKILL.md.tmpl b/qa/SKILL.md.tmpl
index 45dfbea6..bd94debe 100644
--- a/qa/SKILL.md.tmpl
+++ b/qa/SKILL.md.tmpl
@@ -16,6 +16,7 @@ allowed-tools:
   - Glob
   - Grep
   - AskUserQuestion
+  - WebSearch
 ---
 
 {{PREAMBLE}}
@@ -58,6 +59,10 @@ fi
 
 {{BROWSE_SETUP}}
 
+**Check test framework (bootstrap if needed):**
+
+{{TEST_BOOTSTRAP}}
+
 **Create output directories:**
 
 ```bash
@@ -169,6 +174,59 @@ $B snapshot -D
 - **best-effort**: fix applied but couldn't fully verify (e.g., needs auth state, external service)
 - **reverted**: regression detected → `git revert HEAD` → mark issue as "deferred"
 
+### 8e.5. Regression Test
+
+Skip if: classification is not "verified", OR the fix is purely visual/CSS with no JS behavior, OR no test framework was detected AND user declined bootstrap.
+
+**1. Study the project's existing test patterns:**
+
+Read 2-3 test files closest to the fix (same directory, same code type). Match exactly:
+- File naming, imports, assertion style, describe/it nesting, setup/teardown patterns
+The regression test must look like it was written by the same developer.
+
+**2. Trace the bug's codepath, then write a regression test:**
+
+Before writing the test, trace the data flow through the code you just fixed:
+- What input/state triggered the bug? (the exact precondition)
+- What codepath did it follow? (which branches, which function calls)
+- Where did it break? (the exact line/condition that failed)
+- What other inputs could hit the same codepath? (edge cases around the fix)
+
+The test MUST:
+- Set up the precondition that triggered the bug (the exact state that made it break)
+- Perform the action that exposed the bug
+- Assert the correct behavior (NOT "it renders" or "it doesn't throw")
+- If you found adjacent edge cases while tracing, test those too (e.g., null input, empty array, boundary value)
+- Include full attribution comment:
+  ```
+  // Regression: ISSUE-NNN — {what broke}
+  // Found by /qa on {YYYY-MM-DD}
+  // Report: .gstack/qa-reports/qa-report-{domain}-{date}.md
+  ```
+
+Test type decision:
+- Console error / JS exception / logic bug → unit or integration test
+- Broken form / API failure / data flow bug → integration test with request/response
+- Visual bug with JS behavior (broken dropdown, animation) → component test
+- Pure CSS → skip (caught by QA reruns)
+
+Default to unit tests unless the test type decision above calls for an integration or component test. Mock all external dependencies (DB, API, Redis, file system).
+
+Use auto-incrementing names to avoid collisions: check existing `{name}.regression-*.test.{ext}` files, take max number + 1.
+
+**3. Run only the new test file:**
+
+```bash
+{detected test command} {new-test-file}
+```
+
+**4. Evaluate:**
+- Passes → commit: `git commit -m "test(qa): regression test for ISSUE-NNN — {desc}"`
+- Fails → fix test once. Still failing → delete test, defer.
+- Taking >2 min exploration → skip and defer.
+
+**5. WTF-likelihood exclusion:** Regression test commits don't count as fixes when computing the WTF-likelihood heuristic in 8f.
+
 ### 8f. Self-Regulation (STOP AND EVALUATE)
 
 Every 5 fixes (or after any revert), compute the WTF-likelihood:
@@ -242,6 +300,6 @@ If the repo has a `TODOS.md`:
 
 11. **Clean working tree required.** Refuse to start if `git status --porcelain` is non-empty.
 12. **One commit per fix.** Never bundle multiple fixes into one commit.
-13. **Never modify tests or CI configuration.** Only fix application source code.
+13. **Never modify existing tests or existing CI configuration.** Only create new test files, and only during Test Framework Bootstrap or when generating regression tests in Phase 8e.5. The only CI file you may create is the workflow from bootstrap step B5.5.
 14. **Revert on regression.** If a fix makes things worse, `git revert HEAD` immediately.
 15. **Self-regulate.** Follow the WTF-likelihood heuristic. When in doubt, stop and ask.
diff --git a/qa/templates/qa-report-template.md b/qa/templates/qa-report-template.md
index 5466bda4..6aa30943 100644
--- a/qa/templates/qa-report-template.md
+++ b/qa/templates/qa-report-template.md
@@ -86,6 +86,22 @@
 
 ---
 
+## Regression Tests
+
+| Issue | Test File | Status | Description |
+|-------|-----------|--------|-------------|
+| ISSUE-NNN | path/to/test | committed / deferred / skipped | description |
+
+### Deferred Tests
+
+#### ISSUE-NNN: {title}
+**Precondition:** {setup state that triggers the bug}
+**Action:** {what the user does}
+**Expected:** {correct behavior}
+**Why deferred:** {reason}
+
+---
+
 ## Ship Readiness
 
 | Metric | Value |
diff --git a/retro/SKILL.md b/retro/SKILL.md
index c7781525..e7cd3d2c 100644
--- a/retro/SKILL.md
+++ b/retro/SKILL.md
@@ -164,6 +164,15 @@ cat ~/.gstack/greptile-history.md 2>/dev/null || true
 
 # 9. TODOS.md backlog (if available)
 cat TODOS.md 2>/dev/null || true
+
+# 10. Test file count
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' 2>/dev/null | grep -v node_modules | wc -l
+
+# 11. Regression test commits in window
+git log origin/<default> --since="<window>" --oneline --grep="test(qa):" --grep="test(design):" --grep="test: coverage"
+
+# 12. Test files changed in window
+git log origin/<default> --since="<window>" --format="" --name-only | grep -E '\.(test|spec)\.' | sort -u | wc -l
 ```
 
 ### Step 2: Compute Metrics
@@ -185,6 +194,7 @@ Calculate and present these metrics in a summary table:
 | Detected sessions | N |
 | Avg LOC/session-hour | N |
 | Greptile signal | N% (Y catches, Z FPs) |
+| Test Health | N total test files · M added this period · K regression test commits |
 
 Then show a **per-author leaderboard** immediately below:
 
@@ -408,7 +418,17 @@ Use the Write tool to save the JSON file with this schema:
 }
 ```
 
-**Note:** Only include the `greptile` field if `~/.gstack/greptile-history.md` exists and has entries within the time window. Only include the `backlog` field if `TODOS.md` exists. If either has no data, omit the field entirely.
+**Note:** Only include the `greptile` field if `~/.gstack/greptile-history.md` exists and has entries within the time window. Only include the `backlog` field if `TODOS.md` exists. Only include the `test_health` field if test files were found (command 10 returns > 0). If any of these has no data, omit that field entirely.
+
+Include test health data in the JSON when test files exist:
+```json
+  "test_health": {
+    "total_test_files": 47,
+    "tests_added_this_period": 5,
+    "regression_test_commits": 3,
+    "test_files_changed": 8
+  }
+```
 
 Include backlog data in the JSON when TODOS.md exists:
 ```json
@@ -464,6 +484,13 @@ Narrative covering:
 - Any XL PRs that should have been split
 - Greptile signal ratio and trend (if history exists): "Greptile: X% signal (Y valid catches, Z false positives)"
 
+### Test Health
+- Total test files: N (from command 10)
+- Tests added this period: M (from command 12 — test files changed)
+- Regression test commits: list `test(qa):` and `test(design):` and `test: coverage` commits from command 11
+- If prior retro exists and has `test_health`: show delta "Test count: {last} → {now} (+{delta})"
+- If test ratio < 20%: flag as growth area — "100% test coverage is the goal. Tests make vibe coding safe."
+
 ### Focus & Highlights
 (from Step 8)
 - Focus score with interpretation
diff --git a/retro/SKILL.md.tmpl b/retro/SKILL.md.tmpl
index 2f39fb5c..bfbc2003 100644
--- a/retro/SKILL.md.tmpl
+++ b/retro/SKILL.md.tmpl
@@ -99,6 +99,15 @@ cat ~/.gstack/greptile-history.md 2>/dev/null || true
 
 # 9. TODOS.md backlog (if available)
 cat TODOS.md 2>/dev/null || true
+
+# 10. Test file count
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' 2>/dev/null | grep -v node_modules | wc -l
+
+# 11. Regression test commits in window
+git log origin/<default> --since="<window>" --oneline --grep="test(qa):" --grep="test(design):" --grep="test: coverage"
+
+# 12. Test files changed in window
+git log origin/<default> --since="<window>" --format="" --name-only | grep -E '\.(test|spec)\.' | sort -u | wc -l
 ```
 
 ### Step 2: Compute Metrics
@@ -120,6 +129,7 @@ Calculate and present these metrics in a summary table:
 | Detected sessions | N |
 | Avg LOC/session-hour | N |
 | Greptile signal | N% (Y catches, Z FPs) |
+| Test Health | N total test files · M added this period · K regression test commits |
 
 Then show a **per-author leaderboard** immediately below:
 
@@ -343,7 +353,17 @@ Use the Write tool to save the JSON file with this schema:
 }
 ```
 
-**Note:** Only include the `greptile` field if `~/.gstack/greptile-history.md` exists and has entries within the time window. Only include the `backlog` field if `TODOS.md` exists. If either has no data, omit the field entirely.
+**Note:** Only include the `greptile` field if `~/.gstack/greptile-history.md` exists and has entries within the time window. Only include the `backlog` field if `TODOS.md` exists. Only include the `test_health` field if test files were found (command 10 returns > 0). If any of these has no data, omit that field entirely.
+
+Include test health data in the JSON when test files exist:
+```json
+  "test_health": {
+    "total_test_files": 47,
+    "tests_added_this_period": 5,
+    "regression_test_commits": 3,
+    "test_files_changed": 8
+  }
+```
 
 Include backlog data in the JSON when TODOS.md exists:
 ```json
@@ -399,6 +419,13 @@ Narrative covering:
 - Any XL PRs that should have been split
 - Greptile signal ratio and trend (if history exists): "Greptile: X% signal (Y valid catches, Z false positives)"
 
+### Test Health
+- Total test files: N (from command 10)
+- Tests added this period: M (from command 12 — test files changed)
+- Regression test commits: list `test(qa):` and `test(design):` and `test: coverage` commits from command 11
+- If prior retro exists and has `test_health`: show delta "Test count: {last} → {now} (+{delta})"
+- If test ratio < 20%: flag as growth area — "100% test coverage is the goal. Tests make vibe coding safe."
+
 ### Focus & Highlights
 (from Step 8)
 - Focus score with interpretation
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index ee8a1c09..31684e21 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -854,6 +854,161 @@ Parse the output. Find the most recent entry for each skill (plan-ceo-review, pl
 - If \\\`skip_eng_review\\\` config is \\\`true\\\`, Eng Review shows "SKIPPED (global)" and verdict is CLEARED`;
 }
 
+function generateTestBootstrap(): string {
+  return `## Test Framework Bootstrap
+
+**Detect existing test framework and project runtime:**
+
+\`\`\`bash
+# Detect project runtime
+[ -f Gemfile ] && echo "RUNTIME:ruby"
+[ -f package.json ] && echo "RUNTIME:node"
+[ -f requirements.txt ] || [ -f pyproject.toml ] && echo "RUNTIME:python"
+[ -f go.mod ] && echo "RUNTIME:go"
+[ -f Cargo.toml ] && echo "RUNTIME:rust"
+[ -f composer.json ] && echo "RUNTIME:php"
+[ -f mix.exs ] && echo "RUNTIME:elixir"
+# Detect sub-frameworks
+[ -f Gemfile ] && grep -q "rails" Gemfile 2>/dev/null && echo "FRAMEWORK:rails"
+[ -f package.json ] && grep -q '"next"' package.json 2>/dev/null && echo "FRAMEWORK:nextjs"
+# Check for existing test infrastructure
+ls jest.config.* vitest.config.* playwright.config.* .rspec pytest.ini pyproject.toml phpunit.xml 2>/dev/null
+ls -d test/ tests/ spec/ __tests__/ cypress/ e2e/ 2>/dev/null
+# Check opt-out marker
+[ -f .gstack/no-test-bootstrap ] && echo "BOOTSTRAP_DECLINED"
+\`\`\`
+
+**If test framework detected** (config files or test directories found):
+Print "Test framework detected: {name} ({N} existing tests). Skipping bootstrap."
+Read 2-3 existing test files to learn conventions (naming, imports, assertion style, setup patterns).
+Store conventions as prose context for use in Phase 8e.5 or Step 3.4. **Skip the rest of bootstrap.**
+
+**If BOOTSTRAP_DECLINED** appears: Print "Test bootstrap previously declined — skipping." **Skip the rest of bootstrap.**
+
+**If NO runtime detected** (no config files found): Use AskUserQuestion:
+"I couldn't detect your project's language. What runtime are you using?"
+Options: A) Node.js/TypeScript B) Ruby/Rails C) Python D) Go E) Rust F) PHP G) Elixir H) This project doesn't need tests.
+If user picks H → write \`.gstack/no-test-bootstrap\` and continue without tests.
+
+**If runtime detected but no test framework — bootstrap:**
+
+### B2. Research best practices
+
+Use WebSearch to find current best practices for the detected runtime:
+- \`"[runtime] best test framework 2025 2026"\`
+- \`"[framework A] vs [framework B] comparison"\`
+
+If WebSearch is unavailable, use this built-in knowledge table:
+
+| Runtime | Primary recommendation | Alternative |
+|---------|----------------------|-------------|
+| Ruby/Rails | minitest + fixtures + capybara | rspec + factory_bot + shoulda-matchers |
+| Node.js | vitest + @testing-library | jest + @testing-library |
+| Next.js | vitest + @testing-library/react + playwright | jest + cypress |
+| Python | pytest + pytest-cov | unittest |
+| Go | stdlib testing + testify | stdlib only |
+| Rust | cargo test (built-in) + mockall | — |
+| PHP | phpunit + mockery | pest |
+| Elixir | ExUnit (built-in) + ex_machina | — |
+
+### B3. Framework selection
+
+Use AskUserQuestion:
+"I detected this is a [Runtime/Framework] project with no test framework. I researched current best practices. Here are the options:
+A) [Primary] — [rationale]. Includes: [packages]. Supports: unit, integration, smoke, e2e
+B) [Alternative] — [rationale]. Includes: [packages]
+C) Skip — don't set up testing right now
+RECOMMENDATION: Choose A because [reason based on project context]"
+
+If user picks C → write \`.gstack/no-test-bootstrap\`. Tell user: "If you change your mind later, delete \`.gstack/no-test-bootstrap\` and re-run." Continue without tests.
+
+If multiple runtimes detected (monorepo) → ask which runtime to set up first, with option to do both sequentially.
+
+### B4. Install and configure
+
+1. Install the chosen packages (npm/bun/gem/pip/etc.)
+2. Create minimal config file
+3. Create directory structure (test/, spec/, etc.)
+4. Create one example test matching the project's code to verify setup works
+
+If package installation fails → debug once. If still failing → revert with \`git checkout -- package.json package-lock.json\` (or equivalent for the runtime). Warn user and continue without tests.
+
+### B4.5. First real tests
+
+Generate 3-5 real tests for existing code:
+
+1. **Find recently changed files:** \`git log --since=30.days --name-only --format="" | sort | uniq -c | sort -rn | head -10\`
+2. **Prioritize by risk:** Error handlers > business logic with conditionals > API endpoints > pure functions
+3. **For each file:** Write one test that tests real behavior with meaningful assertions. Never \`expect(x).toBeDefined()\` — test what the code DOES.
+4. Run each test. Passes → keep. Fails → fix once. Still fails → delete silently.
+5. Generate at least 1 test, cap at 5.
+
+Never import secrets, API keys, or credentials in test files. Use environment variables or test fixtures.
+
+### B5. Verify
+
+\`\`\`bash
+# Run the full test suite to confirm everything works
+{detected test command}
+\`\`\`
+
+If tests fail → debug once. If still failing → revert all bootstrap changes and warn user.
+
+### B5.5. CI/CD pipeline
+
+\`\`\`bash
+# Check CI provider
+ls -d .github/ 2>/dev/null && echo "CI:github"
+ls .gitlab-ci.yml .circleci/ bitrise.yml 2>/dev/null
+\`\`\`
+
+If \`.github/\` exists (or no CI detected — default to GitHub Actions):
+Create \`.github/workflows/test.yml\` with:
+- \`runs-on: ubuntu-latest\`
+- Appropriate setup action for the runtime (setup-node, setup-ruby, setup-python, etc.)
+- The same test command verified in B5
+- Trigger: push + pull_request
+
+If non-GitHub CI detected → skip CI generation with note: "Detected {provider} — CI pipeline generation supports GitHub Actions only. Add test step to your existing pipeline manually."
+
+### B6. Create TESTING.md
+
+First check: If TESTING.md already exists → read it and update/append rather than overwriting. Never destroy existing content.
+
+Write TESTING.md with:
+- Philosophy: "100% test coverage is the key to great vibe coding. Tests let you move fast, trust your instincts, and ship with confidence — without them, vibe coding is just yolo coding. With tests, it's a superpower."
+- Framework name and version
+- How to run tests (the verified command from B5)
+- Test layers: Unit tests (what, where, when), Integration tests, Smoke tests, E2E tests
+- Conventions: file naming, assertion style, setup/teardown patterns
+
+### B7. Update CLAUDE.md
+
+First check: If CLAUDE.md already has a \`## Testing\` section → skip. Don't duplicate.
+
+Append a \`## Testing\` section:
+- Run command and test directory
+- Reference to TESTING.md
+- Test expectations:
+  - 100% test coverage is the goal — tests make vibe coding safe
+  - When writing new functions, write a corresponding test
+  - When fixing a bug, write a regression test
+  - When adding error handling, write a test that triggers the error
+  - When adding a conditional (if/else, switch), write tests for BOTH paths
+  - Never commit code that makes existing tests fail
+
+### B8. Commit
+
+\`\`\`bash
+git status --porcelain
+\`\`\`
+
+Only commit if there are changes. Stage all bootstrap files (config, test directory, TESTING.md, CLAUDE.md, .github/workflows/test.yml if created):
+\`git commit -m "chore: bootstrap test framework ({framework name})"\`
+
+---`;
+}
+
 const RESOLVERS: Record<string, () => string> = {
   COMMAND_REFERENCE: generateCommandReference,
   SNAPSHOT_FLAGS: generateSnapshotFlags,
@@ -863,6 +1018,7 @@ const RESOLVERS: Record<string, () => string> = {
   QA_METHODOLOGY: generateQAMethodology,
   DESIGN_METHODOLOGY: generateDesignMethodology,
   REVIEW_DASHBOARD: generateReviewDashboard,
+  TEST_BOOTSTRAP: generateTestBootstrap,
 };
 
 // ─── Template Processing ────────────────────────────────────
diff --git a/ship/SKILL.md b/ship/SKILL.md
index dc1a86a2..32582088 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -11,6 +11,7 @@ allowed-tools:
   - Grep
   - Glob
   - AskUserQuestion
+  - WebSearch
 ---
 <!-- AUTO-GENERATED from SKILL.md.tmpl — do not edit directly -->
 <!-- Regenerate: bun run gen:skill-docs -->
@@ -121,6 +122,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - Multi-file changesets (auto-split into bisectable commits)
 - TODOS.md completed-item detection (auto-mark)
 - Auto-fixable review findings (dead code, N+1, stale comments — fixed automatically)
+- Test coverage gaps (auto-generate and commit, or flag in PR body)
 
 ---
 
@@ -210,6 +212,163 @@ git fetch origin <base> && git merge origin/<base> --no-edit
 
 ---
 
+## Step 2.5: Test Framework Bootstrap
+
+## Test Framework Bootstrap
+
+**Detect existing test framework and project runtime:**
+
+```bash
+# Detect project runtime
+[ -f Gemfile ] && echo "RUNTIME:ruby"
+[ -f package.json ] && echo "RUNTIME:node"
+[ -f requirements.txt ] || [ -f pyproject.toml ] && echo "RUNTIME:python"
+[ -f go.mod ] && echo "RUNTIME:go"
+[ -f Cargo.toml ] && echo "RUNTIME:rust"
+[ -f composer.json ] && echo "RUNTIME:php"
+[ -f mix.exs ] && echo "RUNTIME:elixir"
+# Detect sub-frameworks
+[ -f Gemfile ] && grep -q "rails" Gemfile 2>/dev/null && echo "FRAMEWORK:rails"
+[ -f package.json ] && grep -q '"next"' package.json 2>/dev/null && echo "FRAMEWORK:nextjs"
+# Check for existing test infrastructure
+ls jest.config.* vitest.config.* playwright.config.* .rspec pytest.ini pyproject.toml phpunit.xml 2>/dev/null
+ls -d test/ tests/ spec/ __tests__/ cypress/ e2e/ 2>/dev/null
+# Check opt-out marker
+[ -f .gstack/no-test-bootstrap ] && echo "BOOTSTRAP_DECLINED"
+```
+
+**If test framework detected** (config files or test directories found):
+Print "Test framework detected: {name} ({N} existing tests). Skipping bootstrap."
+Read 2-3 existing test files to learn conventions (naming, imports, assertion style, setup patterns).
+Store conventions as prose context for use in Phase 8e.5 or Step 3.4. **Skip the rest of bootstrap.**
+
+**If BOOTSTRAP_DECLINED** appears: Print "Test bootstrap previously declined — skipping." **Skip the rest of bootstrap.**
+
+**If NO runtime detected** (no config files found): Use AskUserQuestion:
+"I couldn't detect your project's language. What runtime are you using?"
+Options: A) Node.js/TypeScript B) Ruby/Rails C) Python D) Go E) Rust F) PHP G) Elixir H) This project doesn't need tests.
+If user picks H → write `.gstack/no-test-bootstrap` and continue without tests.
+
+**If runtime detected but no test framework — bootstrap:**
+
+### B2. Research best practices
+
+Use WebSearch to find current best practices for the detected runtime:
+- `"[runtime] best test framework 2025 2026"`
+- `"[framework A] vs [framework B] comparison"`
+
+If WebSearch is unavailable, use this built-in knowledge table:
+
+| Runtime | Primary recommendation | Alternative |
+|---------|----------------------|-------------|
+| Ruby/Rails | minitest + fixtures + capybara | rspec + factory_bot + shoulda-matchers |
+| Node.js | vitest + @testing-library | jest + @testing-library |
+| Next.js | vitest + @testing-library/react + playwright | jest + cypress |
+| Python | pytest + pytest-cov | unittest |
+| Go | stdlib testing + testify | stdlib only |
+| Rust | cargo test (built-in) + mockall | — |
+| PHP | phpunit + mockery | pest |
+| Elixir | ExUnit (built-in) + ex_machina | — |
+
+### B3. Framework selection
+
+Use AskUserQuestion:
+"I detected this is a [Runtime/Framework] project with no test framework. I researched current best practices. Here are the options:
+A) [Primary] — [rationale]. Includes: [packages]. Supports: unit, integration, smoke, e2e
+B) [Alternative] — [rationale]. Includes: [packages]
+C) Skip — don't set up testing right now
+RECOMMENDATION: Choose A because [reason based on project context]"
+
+If user picks C → write `.gstack/no-test-bootstrap`. Tell user: "If you change your mind later, delete `.gstack/no-test-bootstrap` and re-run." Continue without tests.
+
+If multiple runtimes detected (monorepo) → ask which runtime to set up first, with option to do both sequentially.
+
+### B4. Install and configure
+
+1. Install the chosen packages (npm/bun/gem/pip/etc.)
+2. Create minimal config file
+3. Create directory structure (test/, spec/, etc.)
+4. Create one example test matching the project's code to verify setup works
+
+If package installation fails → debug once. If still failing → revert with `git checkout -- package.json package-lock.json` (or equivalent for the runtime). Warn user and continue without tests.
+
+### B4.5. First real tests
+
+Generate 3-5 real tests for existing code:
+
+1. **Find recently changed files:** `git log --since=30.days --name-only --format="" | sort | uniq -c | sort -rn | head -10`
+2. **Prioritize by risk:** Error handlers > business logic with conditionals > API endpoints > pure functions
+3. **For each file:** Write one test that tests real behavior with meaningful assertions. Never `expect(x).toBeDefined()` — test what the code DOES.
+4. Run each test. Passes → keep. Fails → fix once. Still fails → delete silently.
+5. Generate at least 1 test, cap at 5.
+
+Never import secrets, API keys, or credentials in test files. Use environment variables or test fixtures.
+
+### B5. Verify
+
+```bash
+# Run the full test suite to confirm everything works
+{detected test command}
+```
+
+If tests fail → debug once. If still failing → revert all bootstrap changes and warn user.
+
+### B5.5. CI/CD pipeline
+
+```bash
+# Check CI provider
+ls -d .github/ 2>/dev/null && echo "CI:github"
+ls .gitlab-ci.yml .circleci/ bitrise.yml 2>/dev/null
+```
+
+If `.github/` exists (or no CI detected — default to GitHub Actions):
+Create `.github/workflows/test.yml` with:
+- `runs-on: ubuntu-latest`
+- Appropriate setup action for the runtime (setup-node, setup-ruby, setup-python, etc.)
+- The same test command verified in B5
+- Trigger: push + pull_request
+
+If non-GitHub CI detected → skip CI generation with note: "Detected {provider} — CI pipeline generation supports GitHub Actions only. Add test step to your existing pipeline manually."
+
+### B6. Create TESTING.md
+
+First check: If TESTING.md already exists → read it and update/append rather than overwriting. Never destroy existing content.
+
+Write TESTING.md with:
+- Philosophy: "100% test coverage is the key to great vibe coding. Tests let you move fast, trust your instincts, and ship with confidence — without them, vibe coding is just yolo coding. With tests, it's a superpower."
+- Framework name and version
+- How to run tests (the verified command from B5)
+- Test layers: Unit tests (what, where, when), Integration tests, Smoke tests, E2E tests
+- Conventions: file naming, assertion style, setup/teardown patterns
+
+### B7. Update CLAUDE.md
+
+First check: If CLAUDE.md already has a `## Testing` section → skip. Don't duplicate.
+
+Append a `## Testing` section:
+- Run command and test directory
+- Reference to TESTING.md
+- Test expectations:
+  - 100% test coverage is the goal — tests make vibe coding safe
+  - When writing new functions, write a corresponding test
+  - When fixing a bug, write a regression test
+  - When adding error handling, write a test that triggers the error
+  - When adding a conditional (if/else, switch), write tests for BOTH paths
+  - Never commit code that makes existing tests fail
+
+### B8. Commit
+
+```bash
+git status --porcelain
+```
+
+Only commit if there are changes. Stage all bootstrap files (config, test directory, TESTING.md, CLAUDE.md, .github/workflows/test.yml if created):
+`git commit -m "chore: bootstrap test framework ({framework name})"`
+
+---
+
+---
+
 ## Step 3: Run tests (on merged code)
 
 **Do NOT run `RAILS_ENV=test bin/rails db:migrate`** — `bin/test-lane` already calls
@@ -294,6 +453,144 @@ If multiple suites need to run, run them sequentially (each needs a test lane).
 
 ---
 
+## Step 3.4: Test Coverage Audit
+
+100% coverage is the goal — every untested path is a path where bugs hide and vibe coding becomes yolo coding. Evaluate what was ACTUALLY coded (from the diff), not what was planned.
+
+**0. Before/after test count:**
+
+```bash
+# Count test files before any generation
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' | grep -v node_modules | wc -l
+```
+
+Store this number for the PR body.
+
+**1. Trace every codepath changed** using `git diff origin/<base>...HEAD`:
+
+Read every changed file. For each one, trace how data flows through the code — don't just list functions, actually follow the execution:
+
+1. **Read the diff.** For each changed file, read the full file (not just the diff hunk) to understand context.
+2. **Trace data flow.** Starting from each entry point (route handler, exported function, event listener, component render), follow the data through every branch:
+   - Where does input come from? (request params, props, database, API call)
+   - What transforms it? (validation, mapping, computation)
+   - Where does it go? (database write, API response, rendered output, side effect)
+   - What can go wrong at each step? (null/undefined, invalid input, network failure, empty collection)
+3. **Diagram the execution.** For each changed file, draw an ASCII diagram showing:
+   - Every function/method that was added or modified
+   - Every conditional branch (if/else, switch, ternary, guard clause, early return)
+   - Every error path (try/catch, rescue, error boundary, fallback)
+   - Every call to another function (trace into it — does IT have untested branches?)
+   - Every edge: what happens with null input? Empty array? Invalid type?
+
+This is the critical step — you're building a map of every line of code that can execute differently based on input. Every branch in this diagram needs a test.
+
+**2. Map user flows, interactions, and error states:**
+
+Code coverage isn't enough — you need to cover how real users interact with the changed code. For each changed feature, think through:
+
+- **User flows:** What sequence of actions does a user take that touches this code? Map the full journey (e.g., "user clicks 'Pay' → form validates → API call → success/failure screen"). Each step in the journey needs a test.
+- **Interaction edge cases:** What happens when the user does something unexpected?
+  - Double-click/rapid resubmit
+  - Navigate away mid-operation (back button, close tab, click another link)
+  - Submit with stale data (page sat open for 30 minutes, session expired)
+  - Slow connection (API takes 10 seconds — what does the user see?)
+  - Concurrent actions (two tabs, same form)
+- **Error states the user can see:** For every error the code handles, what does the user actually experience?
+  - Is there a clear error message or a silent failure?
+  - Can the user recover (retry, go back, fix input) or are they stuck?
+  - What happens with no network? With a 500 from the API? With invalid data from the server?
+- **Empty/zero/boundary states:** What does the UI show with zero results? With 10,000 results? With a single character input? With maximum-length input?
+
+Add these to your diagram alongside the code branches. A user flow with no test is just as much a gap as an untested if/else.
+
+**3. Check each branch against existing tests:**
+
+Go through your diagram branch by branch — both code paths AND user flows. For each one, search for a test that exercises it:
+- Function `processPayment()` → look for `billing.test.ts`, `billing.spec.ts`, `test/billing_test.rb`
+- An if/else → look for tests covering BOTH the true AND false path
+- An error handler → look for a test that triggers that specific error condition
+- A call to `helperFn()` that has its own branches → those branches need tests too
+- A user flow → look for an integration or E2E test that walks through the journey
+- An interaction edge case → look for a test that simulates the unexpected action
+
+Quality scoring rubric:
+- ★★★  Tests behavior with edge cases AND error paths
+- ★★   Tests correct behavior, happy path only
+- ★    Smoke test / existence check / trivial assertion (e.g., "it renders", "it doesn't throw")
+
+**4. Output ASCII coverage diagram:**
+
+Include BOTH code paths and user flows in the same diagram:
+
+```
+CODE PATH COVERAGE
+===========================
+[+] src/services/billing.ts
+    │
+    ├── processPayment()
+    │   ├── [★★★ TESTED] Happy path + card declined + expired card — billing.test.ts:42
+    │   ├── [GAP]         Network timeout — NO TEST
+    │   └── [GAP]         Invalid currency — NO TEST
+    │
+    └── refundPayment()
+        ├── [★★  TESTED] Full refund — billing.test.ts:89
+        └── [★   TESTED] Partial refund (checks non-throw only) — billing.test.ts:101
+
+USER FLOW COVERAGE
+===========================
+[+] Payment checkout flow
+    │
+    ├── [★★★ TESTED] Complete purchase — checkout.e2e.ts:15
+    ├── [GAP]         Double-click submit — NO TEST
+    ├── [GAP]         Navigate away during payment — NO TEST
+    └── [★   TESTED] Form validation errors (checks render only) — checkout.test.ts:40
+
+[+] Error states
+    │
+    ├── [★★  TESTED] Card declined message — billing.test.ts:58
+    ├── [GAP]         Network timeout UX (what does user see?) — NO TEST
+    └── [GAP]         Empty cart submission — NO TEST
+
+─────────────────────────────────
+COVERAGE: 6/12 paths tested (50%)
+  Code paths: 3/5 (60%)
+  User flows: 3/7 (43%)
+QUALITY:  ★★★: 2  ★★: 2  ★: 2
+GAPS: 6 paths need tests
+─────────────────────────────────
+```
+
+**Fast path:** All paths covered → "Step 3.4: All new code paths have test coverage ✓" Continue.
+
+**5. Generate tests for uncovered paths:**
+
+If test framework detected (or bootstrapped in Step 2.5):
+- Prioritize error handlers and edge cases first (happy paths are more likely already tested)
+- Read 2-3 existing test files to match conventions exactly
+- Generate unit tests. Mock all external dependencies (DB, API, Redis).
+- Write tests that exercise the specific uncovered path with real assertions
+- Run each test. Passes → commit as `test: coverage for {feature}`
+- Fails → fix once. Still fails → revert, note gap in diagram.
+
+Caps: 30 code paths max, 20 tests generated max (code + user flow combined), 2-min per-test exploration cap.
+
+If no test framework AND user declined bootstrap → diagram only, no generation. Note: "Test generation skipped — no test framework configured."
+
+**Diff is test-only changes:** Skip Step 3.4 entirely: "No new application code paths to audit."
+
+**6. After-count and coverage summary:**
+
+```bash
+# Count test files after generation
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' | grep -v node_modules | wc -l
+```
+
+For PR body: `Tests: {before} → {after} (+{delta} new)`
+Coverage line: `Test Coverage Audit: N new code paths. M covered (X%). K tests generated, J committed.`
+
+---
+
 ## Step 3.5: Pre-Landing Review
 
 Review the diff for structural issues that tests don't catch.
@@ -522,6 +819,10 @@ gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 ## Summary
 <bullet points from CHANGELOG>
 
+## Test Coverage
+<coverage diagram from Step 3.4, or "All new code paths have test coverage.">
+<If Step 3.4 ran: "Tests: {before} → {after} (+{delta} new)">
+
 ## Pre-Landing Review
 <findings from Step 3.5, or "No issues found.">
 
@@ -563,4 +864,5 @@ EOF
 - **Split commits for bisectability** — each commit = one logical change.
 - **TODOS.md completion detection must be conservative.** Only mark items as completed when the diff clearly shows the work is done.
 - **Use Greptile reply templates from greptile-triage.md.** Every reply includes evidence (inline diff, code references, re-rank suggestion). Never post vague replies.
+- **Step 3.4 generates coverage tests.** They must pass before committing. Never commit failing tests.
 - **The goal is: user says `/ship`, next thing they see is the review + PR URL.**
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index bb6db158..e059fc6a 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -11,6 +11,7 @@ allowed-tools:
   - Grep
   - Glob
   - AskUserQuestion
+  - WebSearch
 ---
 
 {{PREAMBLE}}
@@ -39,6 +40,7 @@ You are running the `/ship` workflow. This is a **non-interactive, fully automat
 - Multi-file changesets (auto-split into bisectable commits)
 - TODOS.md completed-item detection (auto-mark)
 - Auto-fixable review findings (dead code, N+1, stale comments — fixed automatically)
+- Test coverage gaps (auto-generate and commit, or flag in PR body)
 
 ---
 
@@ -92,6 +94,12 @@ git fetch origin <base> && git merge origin/<base> --no-edit
 
 ---
 
+## Step 2.5: Test Framework Bootstrap
+
+{{TEST_BOOTSTRAP}}
+
+---
+
 ## Step 3: Run tests (on merged code)
 
 **Do NOT run `RAILS_ENV=test bin/rails db:migrate`** — `bin/test-lane` already calls
@@ -176,6 +184,144 @@ If multiple suites need to run, run them sequentially (each needs a test lane).
 
 ---
 
+## Step 3.4: Test Coverage Audit
+
+100% coverage is the goal — every untested path is a path where bugs hide and vibe coding becomes yolo coding. Evaluate what was ACTUALLY coded (from the diff), not what was planned.
+
+**0. Before/after test count:**
+
+```bash
+# Count test files before any generation
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' | grep -v node_modules | wc -l
+```
+
+Store this number for the PR body.
+
+**1. Trace every codepath changed** using `git diff origin/<base>...HEAD`:
+
+Read every changed file. For each one, trace how data flows through the code — don't just list functions, actually follow the execution:
+
+1. **Read the diff.** For each changed file, read the full file (not just the diff hunk) to understand context.
+2. **Trace data flow.** Starting from each entry point (route handler, exported function, event listener, component render), follow the data through every branch:
+   - Where does input come from? (request params, props, database, API call)
+   - What transforms it? (validation, mapping, computation)
+   - Where does it go? (database write, API response, rendered output, side effect)
+   - What can go wrong at each step? (null/undefined, invalid input, network failure, empty collection)
+3. **Diagram the execution.** For each changed file, draw an ASCII diagram showing:
+   - Every function/method that was added or modified
+   - Every conditional branch (if/else, switch, ternary, guard clause, early return)
+   - Every error path (try/catch, rescue, error boundary, fallback)
+   - Every call to another function (trace into it — does IT have untested branches?)
+   - Every edge: what happens with null input? Empty array? Invalid type?
+
+This is the critical step — you're building a map of every line of code that can execute differently based on input. Every branch in this diagram needs a test.
+
+**2. Map user flows, interactions, and error states:**
+
+Code coverage isn't enough — you need to cover how real users interact with the changed code. For each changed feature, think through:
+
+- **User flows:** What sequence of actions does a user take that touches this code? Map the full journey (e.g., "user clicks 'Pay' → form validates → API call → success/failure screen"). Each step in the journey needs a test.
+- **Interaction edge cases:** What happens when the user does something unexpected?
+  - Double-click/rapid resubmit
+  - Navigate away mid-operation (back button, close tab, click another link)
+  - Submit with stale data (page sat open for 30 minutes, session expired)
+  - Slow connection (API takes 10 seconds — what does the user see?)
+  - Concurrent actions (two tabs, same form)
+- **Error states the user can see:** For every error the code handles, what does the user actually experience?
+  - Is there a clear error message or a silent failure?
+  - Can the user recover (retry, go back, fix input) or are they stuck?
+  - What happens with no network? With a 500 from the API? With invalid data from the server?
+- **Empty/zero/boundary states:** What does the UI show with zero results? With 10,000 results? With a single character input? With maximum-length input?
+
+Add these to your diagram alongside the code branches. A user flow with no test is just as much a gap as an untested if/else.
+
+**3. Check each branch against existing tests:**
+
+Go through your diagram branch by branch — both code paths AND user flows. For each one, search for a test that exercises it:
+- Function `processPayment()` → look for `billing.test.ts`, `billing.spec.ts`, `test/billing_test.rb`
+- An if/else → look for tests covering BOTH the true AND false path
+- An error handler → look for a test that triggers that specific error condition
+- A call to `helperFn()` that has its own branches → those branches need tests too
+- A user flow → look for an integration or E2E test that walks through the journey
+- An interaction edge case → look for a test that simulates the unexpected action
+
+Quality scoring rubric:
+- ★★★  Tests behavior with edge cases AND error paths
+- ★★   Tests correct behavior, happy path only
+- ★    Smoke test / existence check / trivial assertion (e.g., "it renders", "it doesn't throw")
+
+**4. Output ASCII coverage diagram:**
+
+Include BOTH code paths and user flows in the same diagram:
+
+```
+CODE PATH COVERAGE
+===========================
+[+] src/services/billing.ts
+    │
+    ├── processPayment()
+    │   ├── [★★★ TESTED] Happy path + card declined + expired card — billing.test.ts:42
+    │   ├── [GAP]         Network timeout — NO TEST
+    │   └── [GAP]         Invalid currency — NO TEST
+    │
+    └── refundPayment()
+        ├── [★★  TESTED] Full refund — billing.test.ts:89
+        └── [★   TESTED] Partial refund (checks non-throw only) — billing.test.ts:101
+
+USER FLOW COVERAGE
+===========================
+[+] Payment checkout flow
+    │
+    ├── [★★★ TESTED] Complete purchase — checkout.e2e.ts:15
+    ├── [GAP]         Double-click submit — NO TEST
+    ├── [GAP]         Navigate away during payment — NO TEST
+    └── [★   TESTED] Form validation errors (checks render only) — checkout.test.ts:40
+
+[+] Error states
+    │
+    ├── [★★  TESTED] Card declined message — billing.test.ts:58
+    ├── [GAP]         Network timeout UX (what does user see?) — NO TEST
+    └── [GAP]         Empty cart submission — NO TEST
+
+─────────────────────────────────
+COVERAGE: 6/12 paths tested (50%)
+  Code paths: 3/5 (60%)
+  User flows: 3/7 (43%)
+QUALITY:  ★★★: 2  ★★: 2  ★: 2
+GAPS: 6 paths need tests
+─────────────────────────────────
+```
+
+**Fast path:** All paths covered → "Step 3.4: All new code paths have test coverage ✓" Continue.
+
+**5. Generate tests for uncovered paths:**
+
+If test framework detected (or bootstrapped in Step 2.5):
+- Prioritize error handlers and edge cases first (happy paths are more likely already tested)
+- Read 2-3 existing test files to match conventions exactly
+- Generate unit tests. Mock all external dependencies (DB, API, Redis).
+- Write tests that exercise the specific uncovered path with real assertions
+- Run each test. Passes → commit as `test: coverage for {feature}`
+- Fails → fix once. Still fails → revert, note gap in diagram.
+
+Caps: 30 code paths max, 20 tests generated max (code + user flow combined), 2-min per-test exploration cap.
+
+If no test framework AND user declined bootstrap → diagram only, no generation. Note: "Test generation skipped — no test framework configured."
+
+**Diff is test-only changes:** Skip Step 3.4 entirely: "No new application code paths to audit."
+
+**6. After-count and coverage summary:**
+
+```bash
+# Count test files after generation
+find . -name '*.test.*' -o -name '*.spec.*' -o -name '*_test.*' -o -name '*_spec.*' | grep -v node_modules | wc -l
+```
+
+For PR body: `Tests: {before} → {after} (+{delta} new)`
+Coverage line: `Test Coverage Audit: N new code paths. M covered (X%). K tests generated, J committed.`
+
+---
+
 ## Step 3.5: Pre-Landing Review
 
 Review the diff for structural issues that tests don't catch.
@@ -404,6 +550,10 @@ gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 ## Summary
 <bullet points from CHANGELOG>
 
+## Test Coverage
+<coverage diagram from Step 3.4, or "All new code paths have test coverage.">
+<If Step 3.4 ran: "Tests: {before} → {after} (+{delta} new)">
+
 ## Pre-Landing Review
 <findings from Step 3.5, or "No issues found.">
 
@@ -445,4 +595,5 @@ EOF
 - **Split commits for bisectability** — each commit = one logical change.
 - **TODOS.md completion detection must be conservative.** Only mark items as completed when the diff clearly shows the work is done.
 - **Use Greptile reply templates from greptile-triage.md.** Every reply includes evidence (inline diff, code references, re-rank suggestion). Never post vague replies.
+- **Step 3.4 generates coverage tests.** They must pass before committing. Never commit failing tests.
 - **The goal is: user says `/ship`, next thing they see is the review + PR URL.**
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index e50f688e..2ea56da9 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -2298,6 +2298,269 @@ Review the site at ${serverUrl}. Use --quick mode. Skip any AskUserQuestion call
   }, 420_000);
 });
 
+// --- Test Bootstrap E2E ---
+
+describeE2E('Test Bootstrap E2E', () => {
+  let bootstrapDir: string;
+  let bootstrapServer: ReturnType<typeof Bun.serve>;
+
+  beforeAll(() => {
+    bootstrapDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-bootstrap-'));
+    setupBrowseShims(bootstrapDir);
+
+    // Copy the qa skill directory into the sandbox so the prompt's "Read qa/SKILL.md" resolves
+    copyDirSync(path.join(ROOT, 'qa'), path.join(bootstrapDir, 'qa'));
+
+    // Minimal Node.js project: package.json with no dependencies, scripts, or test config
+    fs.writeFileSync(path.join(bootstrapDir, 'package.json'), JSON.stringify({
+      name: 'test-bootstrap-app',
+      version: '1.0.0',
+      type: 'module',
+    }, null, 2));
+
+    // App module with a seeded bug: divide() has no zero-divisor check
+    fs.writeFileSync(path.join(bootstrapDir, 'app.js'), `
+export function add(a, b) { return a + b; }
+export function subtract(a, b) { return a - b; }
+export function divide(a, b) { return a / b; } // BUG: no zero check
+`);
+
+    // HTML page with seeded bugs: a link to a missing page and a console.error on load
+    fs.writeFileSync(path.join(bootstrapDir, 'index.html'), `<!DOCTYPE html>
+<html lang="en">
+<head><meta charset="utf-8"><title>Bootstrap Test</title></head>
+<body>
+  <h1>Test App</h1>
+  <a href="/nonexistent-page">Broken Link</a>
+  <script>console.error("ReferenceError: undefinedVar is not defined");</script>
+</body>
+</html>
+`);
+
+    // Init a git repo with one initial commit (the baseline for the commit-count assertion below)
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: bootstrapDir, stdio: 'pipe', timeout: 5000 });
+    run('git', ['init']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'initial commit']);
+
+    // Serve files from bootstrapDir on 127.0.0.1 (port 0 requested; real port read via .port); missing paths → 404
+    bootstrapServer = Bun.serve({
+      port: 0,
+      hostname: '127.0.0.1',
+      fetch(req) {
+        const url = new URL(req.url);
+        let filePath = url.pathname === '/' ? '/index.html' : url.pathname;
+        filePath = filePath.replace(/^\//, '');
+        const fullPath = path.join(bootstrapDir, filePath);
+        if (!fs.existsSync(fullPath)) {
+          return new Response('Not Found', { status: 404 });
+        }
+        const content = fs.readFileSync(fullPath, 'utf-8');
+        return new Response(content, {
+          headers: { 'Content-Type': 'text/html' },
+        });
+      },
+    });
+  });
+
+  afterAll(() => {
+    bootstrapServer?.stop();
+    try { fs.rmSync(bootstrapDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/qa bootstrap + regression test on zero-test project', async () => {
+    const serverUrl = `http://127.0.0.1:${bootstrapServer!.port}`;
+
+    const result = await runSkillTest({
+      prompt: `You have a browse binary at ${browseBin}. Assign it to B variable like: B="${browseBin}"
+
+Read the file qa/SKILL.md for the QA workflow instructions.
+
+Run a Quick-tier QA test on ${serverUrl}
+The source code for this page is at ${bootstrapDir}/index.html — you can fix bugs there.
+Do NOT use AskUserQuestion — for any AskUserQuestion prompts, choose the RECOMMENDED option automatically.
+Write your report to ${bootstrapDir}/qa-reports/qa-report.md
+
+This project has NO test framework. When the bootstrap asks, pick vitest (option A).
+This is a test+fix loop: find bugs, fix them, write regression tests, commit each fix.`,
+      workingDirectory: bootstrapDir,
+      maxTurns: 50,
+      allowedTools: ['Bash', 'Read', 'Write', 'Edit', 'Glob', 'Grep'],
+      timeout: 420_000,
+      testName: 'qa-bootstrap',
+      runId,
+    });
+
+    logCost('/qa bootstrap', result);
+    recordE2E('/qa bootstrap + regression test', 'Test Bootstrap E2E', result, {
+      passed: ['success', 'error_max_turns'].includes(result.exitReason),
+    });
+
+    expect(['success', 'error_max_turns']).toContain(result.exitReason);
+
+    // Informational only (logged, not asserted): did the run leave a vitest/jest config file?
+    const hasTestConfig = fs.existsSync(path.join(bootstrapDir, 'vitest.config.ts'))
+      || fs.existsSync(path.join(bootstrapDir, 'vitest.config.js'))
+      || fs.existsSync(path.join(bootstrapDir, 'jest.config.js'))
+      || fs.existsSync(path.join(bootstrapDir, 'jest.config.ts'));
+    console.log(`Test config created: ${hasTestConfig}`);
+
+    const hasTestingMd = fs.existsSync(path.join(bootstrapDir, 'TESTING.md'));
+    console.log(`TESTING.md created: ${hasTestingMd}`);
+
+    // Informational only: commits whose message matches "bootstrap"
+    const gitLog = spawnSync('git', ['log', '--oneline', '--grep=bootstrap'], {
+      cwd: bootstrapDir, stdio: 'pipe',
+    });
+    const bootstrapCommits = gitLog.stdout.toString().trim();
+    console.log(`Bootstrap commits: ${bootstrapCommits || 'none'}`);
+
+    // Informational only: commits whose message matches "test(qa)"
+    const regressionLog = spawnSync('git', ['log', '--oneline', '--grep=test(qa)'], {
+      cwd: bootstrapDir, stdio: 'pipe',
+    });
+    const regressionCommits = regressionLog.stdout.toString().trim();
+    console.log(`Regression test commits: ${regressionCommits || 'none'}`);
+
+    // Hard assertion: at least one commit exists beyond the initial one (any commit counts, not only bootstrap)
+    const allCommits = spawnSync('git', ['log', '--oneline'], {
+      cwd: bootstrapDir, stdio: 'pipe',
+    });
+    const totalCommits = allCommits.stdout.toString().trim().split('\n').length;
+    console.log(`Total commits: ${totalCommits}`);
+    expect(totalCommits).toBeGreaterThan(1); // initial commit + at least one more
+  }, 420_000);
+});
+
+// --- Test Coverage Audit E2E ---
+
+describeE2E('Test Coverage Audit E2E', () => {
+  let coverageDir: string;
+
+  beforeAll(() => {
+    coverageDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-coverage-'));
+
+    // Copy the ship and review skill directories into the sandbox (the prompt reads ship/SKILL.md)
+    copyDirSync(path.join(ROOT, 'ship'), path.join(coverageDir, 'ship'));
+    copyDirSync(path.join(ROOT, 'review'), path.join(coverageDir, 'review'));
+
+    // Node.js project that declares vitest as a devDependency; its "test" script is only an echo stub
+    fs.writeFileSync(path.join(coverageDir, 'package.json'), JSON.stringify({
+      name: 'test-coverage-app',
+      version: '1.0.0',
+      type: 'module',
+      scripts: { test: 'echo "no tests yet"' },
+      devDependencies: { vitest: '^1.0.0' },
+    }, null, 2));
+
+    // Minimal vitest config file with an empty test section
+    fs.writeFileSync(path.join(coverageDir, 'vitest.config.ts'),
+      `import { defineConfig } from 'vitest/config';\nexport default defineConfig({ test: {} });\n`);
+
+    fs.writeFileSync(path.join(coverageDir, 'VERSION'), '0.1.0.0\n');
+    fs.writeFileSync(path.join(coverageDir, 'CHANGELOG.md'), '# Changelog\n');
+
+    // Source under audit: two functions, each with two throwing guards followed by a success return
+    fs.mkdirSync(path.join(coverageDir, 'src'), { recursive: true });
+    fs.writeFileSync(path.join(coverageDir, 'src', 'billing.ts'), `
+export function processPayment(amount: number, currency: string) {
+  if (amount <= 0) throw new Error('Invalid amount');
+  if (currency !== 'USD' && currency !== 'EUR') throw new Error('Unsupported currency');
+  return { status: 'success', amount, currency };
+}
+
+export function refundPayment(paymentId: string, reason: string) {
+  if (!paymentId) throw new Error('Payment ID required');
+  if (!reason) throw new Error('Reason required');
+  return { status: 'refunded', paymentId, reason };
+}
+`);
+
+    // Single existing test file: covers only processPayment's success path, leaving the rest as gaps
+    fs.mkdirSync(path.join(coverageDir, 'test'), { recursive: true });
+    fs.writeFileSync(path.join(coverageDir, 'test', 'billing.test.ts'), `
+import { describe, test, expect } from 'vitest';
+import { processPayment } from '../src/billing';
+
+describe('processPayment', () => {
+  test('processes valid payment', () => {
+    const result = processPayment(100, 'USD');
+    expect(result.status).toBe('success');
+  });
+  // GAP: no test for invalid amount
+  // GAP: no test for unsupported currency
+  // GAP: refundPayment not tested at all
+});
+`);
+
+    // Init a git repo whose initial branch is main and commit everything created above
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: coverageDir, stdio: 'pipe', timeout: 5000 });
+    run('git', ['init', '-b', 'main']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'initial commit']);
+
+    // Switch to a feature branch; no commits are added on it, so it points at the same commit as main
+    run('git', ['checkout', '-b', 'feature/billing']);
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(coverageDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/ship Step 3.4 produces coverage diagram', async () => {
+    const result = await runSkillTest({
+      prompt: `Read the file ship/SKILL.md for the ship workflow instructions.
+
+You are on the feature/billing branch. The base branch is main.
+This is a test project — there is no remote, no PR to create.
+
+ONLY run Step 3.4 (Test Coverage Audit) from the ship workflow.
+Skip all other steps (tests, evals, review, version, changelog, commit, push, PR).
+
+The source code is in ${coverageDir}/src/billing.ts.
+Existing tests are in ${coverageDir}/test/billing.test.ts.
+The test command is: echo "tests pass" (mocked — just pretend tests pass).
+
+Produce the ASCII coverage diagram showing which code paths are tested and which have gaps.
+Do NOT generate new tests — just produce the diagram and coverage summary.
+Output the diagram directly.`,
+      workingDirectory: coverageDir,
+      maxTurns: 15,
+      allowedTools: ['Bash', 'Read', 'Write', 'Edit', 'Glob', 'Grep'],
+      timeout: 120_000,
+      testName: 'ship-coverage-audit',
+      runId,
+    });
+
+    logCost('/ship coverage audit', result);
+    recordE2E('/ship Step 3.4 coverage audit', 'Test Coverage Audit E2E', result, {
+      passed: result.exitReason === 'success',
+    });
+
+    expect(result.exitReason).toBe('success');
+
+    // Informational only (logged, not asserted): look for diagram markers in the agent output
+    const output = result.output || '';
+    const hasGap = output.includes('GAP') || output.includes('gap') || output.includes('NO TEST');
+    const hasTested = output.includes('TESTED') || output.includes('tested') || output.includes('✓');
+    const hasCoverage = output.includes('COVERAGE') || output.includes('coverage') || output.includes('paths tested');
+
+    console.log(`Output has GAP markers: ${hasGap}`);
+    console.log(`Output has TESTED markers: ${hasTested}`);
+    console.log(`Output has coverage summary: ${hasCoverage}`);
+
+    // Hard assertion: the agent issued at least one Read tool call (which file it read is not checked)
+    const readCalls = result.toolCalls.filter(tc => tc.tool === 'Read');
+    expect(readCalls.length).toBeGreaterThan(0);
+  }, 180_000);
+});
+
 // Module-level afterAll — finalize eval collector after all tests complete
 afterAll(async () => {
   if (evalCollector) {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 4231a91d..54e03a4d 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -737,3 +737,225 @@ describe('gstack-slug', () => {
     expect(lines[1]).toMatch(/^BRANCH=.+/);
   });
 });
+
+// --- Test Bootstrap validation ---
+
+describe('Test Bootstrap ({{TEST_BOOTSTRAP}}) integration', () => {
+  test('TEST_BOOTSTRAP resolver produces valid content', () => {
+    const qaContent = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(qaContent).toContain('Test Framework Bootstrap');
+    expect(qaContent).toContain('RUNTIME:ruby');
+    expect(qaContent).toContain('RUNTIME:node');
+    expect(qaContent).toContain('RUNTIME:python');
+    expect(qaContent).toContain('no-test-bootstrap');
+    expect(qaContent).toContain('BOOTSTRAP_DECLINED');
+  });
+
+  test('TEST_BOOTSTRAP appears in qa/SKILL.md', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Test Framework Bootstrap');
+    expect(content).toContain('TESTING.md');
+    expect(content).toContain('CLAUDE.md');
+  });
+
+  test('TEST_BOOTSTRAP appears in ship/SKILL.md', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Test Framework Bootstrap');
+    expect(content).toContain('Step 2.5');
+  });
+
+  test('TEST_BOOTSTRAP appears in qa-design-review/SKILL.md', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa-design-review', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Test Framework Bootstrap');
+  });
+
+  test('TEST_BOOTSTRAP does NOT appear in qa-only/SKILL.md', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa-only', 'SKILL.md'), 'utf-8');
+    expect(content).not.toContain('Test Framework Bootstrap');
+    // But should have the recommendation note
+    expect(content).toContain('No test framework detected');
+    expect(content).toContain('Run `/qa` to bootstrap');
+  });
+
+  test('bootstrap includes framework knowledge table', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('vitest');
+    expect(content).toContain('minitest');
+    expect(content).toContain('pytest');
+    expect(content).toContain('cargo test');
+    expect(content).toContain('phpunit');
+    expect(content).toContain('ExUnit');
+  });
+
+  test('bootstrap includes CI/CD pipeline generation', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('.github/workflows/test.yml');
+    expect(content).toContain('GitHub Actions');
+  });
+
+  test('bootstrap includes first real tests step', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('First real tests');
+    expect(content).toContain('git log --since=30.days');
+    expect(content).toContain('Prioritize by risk');
+  });
+
+  test('bootstrap includes vibe coding philosophy', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('vibe coding');
+    expect(content).toContain('100% test coverage');
+  });
+
+  test('WebSearch is in allowed-tools for qa, ship, qa-design-review', () => {
+    const qa = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    const ship = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    const qaDesign = fs.readFileSync(path.join(ROOT, 'qa-design-review', 'SKILL.md'), 'utf-8');
+    expect(qa).toContain('WebSearch');
+    expect(ship).toContain('WebSearch');
+    expect(qaDesign).toContain('WebSearch');
+  });
+});
+
+// --- Phase 8e.5 regression test validation ---
+
+describe('Phase 8e.5 regression test generation', () => {
+  test('qa/SKILL.md contains Phase 8e.5', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('8e.5. Regression Test');
+    expect(content).toContain('test(qa): regression test');
+    expect(content).toContain('WTF-likelihood exclusion');
+  });
+
+  test('qa/SKILL.md Rule 13 is amended for regression tests', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Only modify tests when generating regression tests in Phase 8e.5');
+    expect(content).not.toContain('Never modify tests or CI configuration');
+  });
+
+  test('qa-design-review has CSS-aware Phase 8e.5 variant', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa-design-review', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('8e.5. Regression Test (design-review variant)');
+    expect(content).toContain('CSS-only');
+    expect(content).toContain('test(design): regression test');
+  });
+
+  test('regression test includes full attribution comment format', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('// Regression: ISSUE-NNN');
+    expect(content).toContain('// Found by /qa on');
+    expect(content).toContain('// Report: .gstack/qa-reports/');
+  });
+
+  test('regression test uses auto-incrementing names', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('auto-incrementing');
+    expect(content).toContain('max number + 1');
+  });
+});
+
+// --- Step 3.4 coverage audit validation ---
+
+describe('Step 3.4 test coverage audit', () => {
+  test('ship/SKILL.md contains Step 3.4', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Step 3.4: Test Coverage Audit');
+    expect(content).toContain('CODE PATH COVERAGE');
+  });
+
+  test('Step 3.4 includes quality scoring rubric', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('★★★');
+    expect(content).toContain('★★');
+    expect(content).toContain('edge cases AND error paths');
+    expect(content).toContain('happy path only');
+  });
+
+  test('Step 3.4 includes before/after test count', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Count test files before');
+    expect(content).toContain('Count test files after');
+  });
+
+  test('ship PR body includes Test Coverage section', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('## Test Coverage');
+  });
+
+  test('ship rules include test generation rule', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Step 3.4 generates coverage tests');
+    expect(content).toContain('Never commit failing tests');
+  });
+
+  test('Step 3.4 includes vibe coding philosophy', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('vibe coding becomes yolo coding');
+  });
+
+  test('Step 3.4 traces actual codepaths, not just syntax', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Trace every codepath');
+    expect(content).toContain('Trace data flow');
+    expect(content).toContain('Diagram the execution');
+  });
+
+  test('Step 3.4 maps user flows and interaction edge cases', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Map user flows');
+    expect(content).toContain('Interaction edge cases');
+    expect(content).toContain('Double-click');
+    expect(content).toContain('Navigate away');
+    expect(content).toContain('Error states the user can see');
+    expect(content).toContain('Empty/zero/boundary states');
+  });
+
+  test('Step 3.4 diagram includes USER FLOW COVERAGE section', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('USER FLOW COVERAGE');
+    expect(content).toContain('Code paths:');
+    expect(content).toContain('User flows:');
+  });
+});
+
+// --- Retro test health validation ---
+
+describe('Retro test health tracking', () => {
+  test('retro/SKILL.md has test health data gathering commands', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'retro', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('# 10. Test file count');
+    expect(content).toContain('# 11. Regression test commits');
+    expect(content).toContain('# 12. Test files changed');
+  });
+
+  test('retro/SKILL.md has Test Health metrics row', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'retro', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('Test Health');
+    expect(content).toContain('regression tests');
+  });
+
+  test('retro/SKILL.md has Test Health narrative section', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'retro', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('### Test Health');
+    expect(content).toContain('Total test files');
+    expect(content).toContain('vibe coding safe');
+  });
+
+  test('retro JSON schema includes test_health field', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'retro', 'SKILL.md'), 'utf-8');
+    expect(content).toContain('test_health');
+    expect(content).toContain('total_test_files');
+    expect(content).toContain('regression_test_commits');
+  });
+});
+
+// --- QA report template regression tests section ---
+
+describe('QA report template', () => {
+  test('qa-report-template.md has Regression Tests section', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'qa', 'templates', 'qa-report-template.md'), 'utf-8');
+    expect(content).toContain('## Regression Tests');
+    expect(content).toContain('committed / deferred / skipped');
+    expect(content).toContain('### Deferred Tests');
+    expect(content).toContain('**Precondition:**');
+  });
+});

From 1f3b6914112ab7c9ba6c08e66d6774801f1c25d9 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 13:06:14 -0500
Subject: [PATCH 16/22] feat: /gstack-upgrade detects and syncs stale vendored
 copies (v0.6.0.1) (#137)

When the global gstack is already up to date, standalone /gstack-upgrade
now checks if the local vendored copy in the current project is at a
different version and syncs it automatically. Also adds rollback on
setup failure and update-check fallback matching the preamble pattern.

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                 | 10 ++++++++++
 VERSION                      |  2 +-
 gstack-upgrade/SKILL.md      | 28 ++++++++++++++++++++++++++--
 gstack-upgrade/SKILL.md.tmpl | 28 ++++++++++++++++++++++++++--
 4 files changed, 63 insertions(+), 5 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 12fa243b..4593d3f1 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,15 @@
 # Changelog
 
+## 0.6.0.1 — 2026-03-17
+
+- **`/gstack-upgrade` now catches stale vendored copies automatically.** If your global gstack is up to date but the vendored copy in your project is behind, `/gstack-upgrade` detects the mismatch and syncs it. No more manually asking "did we vendor it?" — it just tells you and offers to update.
+- **Upgrade sync is safer.** If `./setup` fails while syncing a vendored copy, gstack restores the previous version from backup instead of leaving a broken install.
+
+### For contributors
+
+- Standalone usage section in `gstack-upgrade/SKILL.md.tmpl` now references Steps 2 and 4.5 (DRY) instead of duplicating detection/sync bash blocks. Added one new version-comparison bash block.
+- Update check fallback in standalone mode now matches the preamble pattern (global path → local path → `|| true`).
+
 ## 0.6.0 — 2026-03-17
 
 - **100% test coverage is the key to great vibe coding.** gstack now bootstraps test frameworks from scratch when your project doesn't have one. Detects your runtime, researches the best framework, asks you to pick, installs it, writes 3-5 real tests for your actual code, sets up CI/CD (GitHub Actions), creates TESTING.md, and adds test culture instructions to CLAUDE.md. Every Claude Code session after that writes tests naturally.
diff --git a/VERSION b/VERSION
index a918a2aa..758efdb4 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.6.0
+0.6.0.1
diff --git a/gstack-upgrade/SKILL.md b/gstack-upgrade/SKILL.md
index 9d635651..50b67dfc 100644
--- a/gstack-upgrade/SKILL.md
+++ b/gstack-upgrade/SKILL.md
@@ -156,6 +156,13 @@ rm -rf "$LOCAL_GSTACK.bak"
 ```
 Tell user: "Also updated vendored copy at `$LOCAL_GSTACK` — commit `.claude/skills/gstack/` when you're ready."
 
+If `./setup` fails, restore from backup and warn the user:
+```bash
+rm -rf "$LOCAL_GSTACK"
+mv "$LOCAL_GSTACK.bak" "$LOCAL_GSTACK"
+```
+Tell user: "Sync failed — restored previous version at `$LOCAL_GSTACK`. Run `/gstack-upgrade` manually to retry."
+
 ### Step 5: Write marker + clear cache
 
 ```bash
@@ -193,9 +200,26 @@ When invoked directly as `/gstack-upgrade` (not from a preamble):
 
 1. Force a fresh update check (bypass cache):
 ```bash
-~/.claude/skills/gstack/bin/gstack-update-check --force
+~/.claude/skills/gstack/bin/gstack-update-check --force 2>/dev/null || \
+.claude/skills/gstack/bin/gstack-update-check --force 2>/dev/null || true
 ```
 Use the output to determine if an upgrade is available.
 
 2. If `UPGRADE_AVAILABLE <old> <new>`: follow Steps 2-6 above.
-3. If no output (up to date): tell the user "You're already on the latest version (v{version})."
+
+3. If no output (primary is up to date): check for a stale local vendored copy.
+
+Run the Step 2 bash block above to detect the primary install type and directory (`INSTALL_TYPE` and `INSTALL_DIR`). Then run the Step 4.5 detection bash block above to check for a local vendored copy (`LOCAL_GSTACK`).
+
+**If `LOCAL_GSTACK` is empty** (no local vendored copy): tell the user "You're already on the latest version (v{version})."
+
+**If `LOCAL_GSTACK` is non-empty**, compare versions:
+```bash
+PRIMARY_VER=$(cat "$INSTALL_DIR/VERSION" 2>/dev/null || echo "unknown")
+LOCAL_VER=$(cat "$LOCAL_GSTACK/VERSION" 2>/dev/null || echo "unknown")
+echo "PRIMARY=$PRIMARY_VER LOCAL=$LOCAL_VER"
+```
+
+**If versions differ:** follow the Step 4.5 sync bash block above to update the local copy from the primary. Tell user: "Global v{PRIMARY_VER} is up to date. Updated local vendored copy from v{LOCAL_VER} → v{PRIMARY_VER}. Commit `.claude/skills/gstack/` when you're ready."
+
+**If versions match:** tell the user "You're on the latest version (v{PRIMARY_VER}). Global and local vendored copy are both up to date."
diff --git a/gstack-upgrade/SKILL.md.tmpl b/gstack-upgrade/SKILL.md.tmpl
index a441b8d6..0acf16c2 100644
--- a/gstack-upgrade/SKILL.md.tmpl
+++ b/gstack-upgrade/SKILL.md.tmpl
@@ -154,6 +154,13 @@ rm -rf "$LOCAL_GSTACK.bak"
 ```
 Tell user: "Also updated vendored copy at `$LOCAL_GSTACK` — commit `.claude/skills/gstack/` when you're ready."
 
+If `./setup` fails, restore from backup and warn the user:
+```bash
+rm -rf "$LOCAL_GSTACK"
+mv "$LOCAL_GSTACK.bak" "$LOCAL_GSTACK"
+```
+Tell user: "Sync failed — restored previous version at `$LOCAL_GSTACK`. Run `/gstack-upgrade` manually to retry."
+
 ### Step 5: Write marker + clear cache
 
 ```bash
@@ -191,9 +198,26 @@ When invoked directly as `/gstack-upgrade` (not from a preamble):
 
 1. Force a fresh update check (bypass cache):
 ```bash
-~/.claude/skills/gstack/bin/gstack-update-check --force
+~/.claude/skills/gstack/bin/gstack-update-check --force 2>/dev/null || \
+.claude/skills/gstack/bin/gstack-update-check --force 2>/dev/null || true
 ```
 Use the output to determine if an upgrade is available.
 
 2. If `UPGRADE_AVAILABLE <old> <new>`: follow Steps 2-6 above.
-3. If no output (up to date): tell the user "You're already on the latest version (v{version})."
+
+3. If no output (primary is up to date): check for a stale local vendored copy.
+
+Run the Step 2 bash block above to detect the primary install type and directory (`INSTALL_TYPE` and `INSTALL_DIR`). Then run the Step 4.5 detection bash block above to check for a local vendored copy (`LOCAL_GSTACK`).
+
+**If `LOCAL_GSTACK` is empty** (no local vendored copy): tell the user "You're already on the latest version (v{version})."
+
+**If `LOCAL_GSTACK` is non-empty**, compare versions:
+```bash
+PRIMARY_VER=$(cat "$INSTALL_DIR/VERSION" 2>/dev/null || echo "unknown")
+LOCAL_VER=$(cat "$LOCAL_GSTACK/VERSION" 2>/dev/null || echo "unknown")
+echo "PRIMARY=$PRIMARY_VER LOCAL=$LOCAL_VER"
+```
+
+**If versions differ:** follow the Step 4.5 sync bash block above to update the local copy from the primary. Tell user: "Global v{PRIMARY_VER} is up to date. Updated local vendored copy from v{LOCAL_VER} → v{PRIMARY_VER}. Commit `.claude/skills/gstack/` when you're ready."
+
+**If versions match:** tell the user "You're on the latest version (v{PRIMARY_VER}). Global and local vendored copy are both up to date."

From 9d47619e4c721365744c080d27455268ee93ed96 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 16:34:08 -0500
Subject: [PATCH 17/22] =?UTF-8?q?feat:=20Completeness=20Principle=20?=
 =?UTF-8?q?=E2=80=94=20Boil=20the=20Lake=20(v0.6.1)=20(#140)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: Completeness Principle — Boil the Lake (WIP, pre-merge)

Add Completeness Principle to all skill preambles, dual-time estimates,
compression table, anti-pattern gallery, Lake Score, and completeness
gaps review category. VERSION/CHANGELOG will be rebased after merge.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* fix: update stale version reference in TODOS.md (v0.5.3 → v0.6.1)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: update CHANGELOG date + README for v0.6.1 features

- Add date to CHANGELOG 0.6.1 entry
- Add Completeness Principle to README intro
- Add SELECTIVE EXPANSION mode to CEO review section
- Add test bootstrap mention to /ship section
- Fix uninstall command missing design-consultation in project uninstall
- Add "recommends shortcuts" and "no tests" to Without gstack list

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: split README into lean intro + docs/ directory (gh CLI pattern)

README: 875 → 243 lines. Keeps intro, skill table, demo, install, and
troubleshooting. All per-skill deep dives, Greptile integration guide,
and contributor mode docs moved to docs/ directory.

- docs/skills.md — full philosophy and examples for all 13 skills
- docs/greptile.md — Greptile setup and triage workflow
- docs/contributor-mode.md — how to enable and use contributor mode
- README now links to docs/ via Documentation table
- Updated skill table entries with latest features (fix-first, regression
  tests, test health, completeness gaps)
- Updated demo transcript with AUTO-FIXED, coverage audit, regression test

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: remove "competitor" language, rewrite README in Garry's voice

Replace "browses competitors" with "knows the landscape" / "what's out
there" throughout all user-facing copy. Trim README from 243 to 167
lines — tighter, more opinionated, less listicle energy. Remove
Completeness Principle from README top (it lives in CLAUDE.md and the
skill preambles where Claude actually reads it).

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: rewrite README in Garry's raw voice — AGI era, L8 factory, real stories

The README now sounds like Garry, not a product page. Leads with the
live experiment, the 16k LOC/day reality, the real-life coding stories
(Austin, hospital bedside). Highlights the newest unlocks (design at
the heart, /qa parallelism, smart review routing, test bootstrap).
Closes with an open invitation — free MIT, fork it, let's all ride
the wave together.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add Garry's bonafides to README intro — Palantir, Posterous, YC, 600k LOC

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add real /retro numbers — 140k lines, 362 commits across 3 projects

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add "in the last 60 days" timeframe to 600k LOC claim

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add GitHub contribution graphs — 2026 vs 2013 side by side

Same person, different era. 2013: 772 contributions building Bookface.
2026: 1,237 contributions and accelerating. The difference is the tooling.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: clarify /retro stats are from last 7 days

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add designer/PM/eng manager roles to intro

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: remove Josh/L8 reference from README

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: move demo up, make it dramatically more impressive

Show the actual architecture diagram, auto-fixed issues, 100% coverage,
regression test generation. Punch line: "That is not a copilot. That is
a team."

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: remove "My journey" section — intro already covers it

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: prefix all skill commands with You: in demo transcript

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: collapse You/Claude lines in demo — no gap between command and response

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: clarify plan mode flow in demo — approve, exit, Claude implements

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: move /ship to end of demo — review → QA → ship is the real flow

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add /plan-design-review to demo, tighten CEO response

Shorter CEO reply, compressed eng diagram, added design audit with
AI Slop score. Seven commands now: plan → eng → build → design →
review → QA → ship.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: move design review before implementation — it's part of planning

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: reorder demo — design before eng, after CEO

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: remove URL from /plan-design-review in demo

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add [...] annotations showing what actually happens at each step

Each step now shows what the agent does under the hood: 8 expansion
proposals cherry-picked, 80-item design audit, ASCII diagrams for
every flow, 2400 lines written in 8 minutes, real browser QA, bug
found and fixed. Makes the demo feel real, not abstract.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: rename Contributor Mode to How to Contribute in docs table

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add Coinbase, Instacart, Rippling to YC bonafides

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add "one or two people in a garage" to founder story

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: add skill table to top of skills.md with anchor links

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

* docs: consolidate — roll contributor-mode into CONTRIBUTING, greptile into skills

- docs/contributor-mode.md → merged into CONTRIBUTING.md (session awareness section)
- docs/greptile.md → merged into docs/skills.md (Greptile integration section)
- Reordered docs table: Skills > Architecture > Browser > Contributing > Changelog

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 CHANGELOG.md                      |  25 +-
 CLAUDE.md                         |  17 +
 CONTRIBUTING.md                   |   4 +
 README.md                         | 885 ++++--------------------------
 SKILL.md                          |  43 +-
 TODOS.md                          |  24 +
 VERSION                           |   2 +-
 browse/SKILL.md                   |  43 +-
 design-consultation/SKILL.md      |  61 +-
 design-consultation/SKILL.md.tmpl |  18 +-
 docs/images/github-2013.png       | Bin 0 -> 63425 bytes
 docs/images/github-2026.png       | Bin 0 -> 60481 bytes
 docs/skills.md                    | 649 ++++++++++++++++++++++
 document-release/SKILL.md         |  43 +-
 plan-ceo-review/SKILL.md          |  52 +-
 plan-ceo-review/SKILL.md.tmpl     |   9 +-
 plan-design-review/SKILL.md       |  43 +-
 plan-eng-review/SKILL.md          |  48 +-
 plan-eng-review/SKILL.md.tmpl     |   5 +-
 qa-design-review/SKILL.md         |  43 +-
 qa-only/SKILL.md                  |  43 +-
 qa/SKILL.md                       |  43 +-
 retro/SKILL.md                    |  43 +-
 review/SKILL.md                   |  43 +-
 review/checklist.md               |   7 +
 scripts/gen-skill-docs.ts         |  43 +-
 setup-browser-cookies/SKILL.md    |  43 +-
 ship/SKILL.md                     |  43 +-
 test/skill-e2e.test.ts            |   2 +-
 test/skill-validation.test.ts     |  37 ++
 30 files changed, 1529 insertions(+), 832 deletions(-)
 create mode 100644 docs/images/github-2013.png
 create mode 100644 docs/images/github-2026.png
 create mode 100644 docs/skills.md

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 4593d3f1..be473577 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,28 @@
 # Changelog
 
+## 0.6.1 — 2026-03-17 — Boil the Lake
+
+Every gstack skill now follows the **Completeness Principle**: always recommend the
+full implementation when AI makes the marginal cost near-zero. No more "Choose B
+because it's 90% of the value" when option A is 70 lines more code.
+
+Read the philosophy: https://garryslist.org/posts/boil-the-ocean
+
+- **Completeness scoring**: every AskUserQuestion option now shows a completeness
+  score (1-10), biasing toward the complete solution
+- **Dual time estimates**: effort estimates show both human-team and CC+gstack time
+  (e.g., "human: ~2 weeks / CC: ~1 hour") with a task-type compression reference table
+- **Anti-pattern examples**: concrete "don't do this" gallery in the preamble so the
+  principle isn't abstract
+- **First-time onboarding**: new users see a one-time introduction linking to the
+  essay, with option to open in browser
+- **Review completeness gaps**: `/review` now flags shortcut implementations where the
+  complete version costs <30 min CC time
+- **Lake Score**: CEO and Eng review completion summaries show how many recommendations
+  chose the complete option vs shortcuts
+- **CEO + Eng review dual-time**: temporal interrogation, effort estimates, and delight
+  opportunities all show both human and CC time scales
+
 ## 0.6.0.1 — 2026-03-17
 
 - **`/gstack-upgrade` now catches stale vendored copies automatically.** If your global gstack is up to date but the vendored copy in your project is behind, `/gstack-upgrade` detects the mismatch and syncs it. No more manually asking "did we vendor it?" — it just tells you and offers to update.
@@ -63,7 +86,7 @@
 ## 0.5.2 — 2026-03-17
 
 - **Your design consultant now takes creative risks.** `/design-consultation` doesn't just propose a safe, coherent system — it explicitly breaks down SAFE CHOICES (category baseline) vs. RISKS (where your product stands out). You pick which rules to break. Every risk comes with a rationale for why it works and what it costs.
-- **See the competition before you choose.** When you opt into research, the agent browses competitor sites with screenshots and accessibility tree analysis — not just web search results. You see what the landscape looks like before making design decisions.
+- **See the landscape before you choose.** When you opt into research, the agent browses real sites in your space with screenshots and accessibility tree analysis — not just web search results. You see what's out there before making design decisions.
 - **Preview pages that look like your product.** The preview page now renders realistic product mockups — dashboards with sidebar nav and data tables, marketing pages with hero sections, settings pages with forms — not just font swatches and color palettes.
 
 ## 0.5.1 — 2026-03-17
diff --git a/CLAUDE.md b/CLAUDE.md
index 27523c7b..34868b0a 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -121,6 +121,23 @@ CHANGELOG.md is **for users**, not contributors. Write it like product release n
 - No jargon: say "every question now tells you which project and branch you're in" not
   "AskUserQuestion format standardized across skill templates via preamble resolver."
 
+## AI effort compression
+
+When estimating or discussing effort, always show both human-team and CC+gstack time:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+Completeness is cheap. Don't recommend shortcuts when the complete implementation
+is a "lake" (achievable) not an "ocean" (multi-quarter migration). See the
+Completeness Principle in the skill preamble for the full philosophy.
+
 ## Local plans
 
 Contributors can store long-range vision docs and design documents in `~/.gstack-dev/plans/`.
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 4af2e889..2fce6375 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -54,6 +54,10 @@ the issue, fix it, and open a PR.
 This is the best way to contribute: fix gstack while doing your real work, in the
 project where you actually felt the pain.
 
+### Session awareness
+
+When you have 3+ gstack sessions open simultaneously, every question tells you which project, which branch, and what's happening. No more staring at a question thinking "wait, which window is this?" The format is consistent across all 13 skills.
+
 ## Working on gstack inside the gstack repo
 
 When you're editing gstack skills and want to test them by actually using gstack
diff --git a/README.md b/README.md
index fd4b684f..c0a5f0b6 100644
--- a/README.md
+++ b/README.md
@@ -1,136 +1,136 @@
 # gstack
 
-**gstack turns Claude Code from one generic assistant into a team of specialists you can summon on demand.**
+Hi, I'm [Garry Tan](https://x.com/garrytan). I'm President & CEO of [Y Combinator](https://www.ycombinator.com/), where I've worked with thousands of startups including Coinbase, Instacart, and Rippling when the founders were just one or two people in a garage — companies now worth tens of billions of dollars. Before YC, I designed the Palantir logo and was one of the first eng manager/PM/designers there. I cofounded Posterous, a blog platform we sold to Twitter. I built Bookface, YC's internal social network, back in 2013. I've been building products as a designer, PM, and eng manager for a long time.
 
-Thirteen opinionated workflow skills for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). Plan review, design review, code review, one-command shipping, browser automation, QA testing, engineering retrospectives, and post-ship documentation — all as slash commands.
+And right now I am in the middle of something that feels like a new era entirely.
 
-### Without gstack
+In the last 60 days I have written **over 600,000 lines of production code** — 35% tests — and I am doing **10,000 to 20,000 usable lines of code per day** part-time, alongside all my duties as CEO of YC. That is not a typo. My last `/retro` (developer stats from the last 7 days) across 3 projects: **140,751 lines added, 362 commits, ~115k net LOC**. The models are getting dramatically better every week. We are at the dawn of something real — one person shipping at a scale that used to require a team of twenty.
 
-- The agent takes your request literally — it never asks if you're building the right thing
-- It will implement exactly what you said, even when the real product is something bigger
-- "Review my PR" gives inconsistent depth every time
-- "Ship this" turns into a long back-and-forth about what to do
-- The agent can write code but can't see your app — it's half blind
-- You still do QA by hand: open browser, click around, check pages, squint at layouts
+**2026 — 1,237 contributions and counting:**
 
-### With gstack
+![GitHub contributions 2026 — 1,237 contributions, massive acceleration in Jan-Mar](docs/images/github-2026.png)
 
-| Skill | Mode | What it does |
-|-------|------|--------------|
-| `/plan-ceo-review` | Founder / CEO | Rethink the problem. Find the 10-star product hiding inside the request. |
-| `/plan-eng-review` | Eng manager / tech lead | Lock in architecture, data flow, diagrams, edge cases, and tests. |
-| `/plan-design-review` | Senior product designer | Designer's eye audit. 80-item checklist, letter grades, AI Slop detection, DESIGN.md inference. Report only — never touches code. |
-| `/design-consultation` | Design consultant | Build a complete design system from scratch. Browses competitors to get in the ballpark, proposes safe choices AND creative risks, generates realistic product mockups, and writes DESIGN.md. |
-| `/review` | Paranoid staff engineer | Find the bugs that pass CI but blow up in production. Triages Greptile review comments. |
-| `/ship` | Release engineer | Sync main, run tests, resolve Greptile reviews, push, open PR. For a ready branch, not for deciding what to build. |
-| `/browse` | QA engineer | Give the agent eyes. It logs in, clicks through your app, takes screenshots, catches breakage. Full QA pass in 60 seconds. |
-| `/qa` | QA + fix engineer | Test app, find bugs, fix them with atomic commits, re-verify. Before/after health scores and ship-readiness summary. Three tiers: Quick, Standard, Exhaustive. |
-| `/qa-only` | QA reporter | Report-only QA testing. Same methodology as /qa but never fixes anything. Use when you want a pure bug report without code changes. |
-| `/qa-design-review` | Designer + frontend engineer | Same design audit as /plan-design-review, then fixes what it finds. Atomic `style(design):` commits, before/after screenshots, CSS-safe self-regulation. |
-| `/setup-browser-cookies` | Session manager | Import cookies from your real browser (Comet, Chrome, Arc, Brave, Edge) into the headless session. Test authenticated pages without logging in manually. |
-| `/retro` | Engineering manager | Team-aware retro: your deep-dive + per-person praise and growth opportunities for every contributor. |
-| `/document-release` | Technical writer | Update README, ARCHITECTURE, CONTRIBUTING, and project docs to match what you just shipped. |
+**2013 — when I built Bookface at YC (772 contributions):**
 
-## Demo: one feature, five modes
+![GitHub contributions 2013 — 772 contributions building Bookface at YC](docs/images/github-2013.png)
 
-I start almost every feature in plan mode. I describe what I want to build, then use `/plan-ceo-review` to pressure-test whether I am even building the right thing. Only after the product direction is locked do I shift into engineering, review, ship, and test.
+Same person. Different era. The difference is the tooling.
 
-```
-You:   [enter plan mode, describe the feature]
-       I want to add seller photo upload to the listing app. Sellers
-       should be able to upload a photo of their item and we create
-       the listing from it.
-
-You:   /plan-ceo-review
-
-Claude: "Photo upload" is not the feature. The real job is helping sellers
-        create listings that actually sell. Here's what the 10-star version
-        looks like: auto-identify the product from the photo, pull specs and
-        pricing comps from the web, draft the title and description, suggest
-        the best hero image...
+**gstack is how I do it.** It is my open source software factory. It turns Claude Code into a virtual engineering team you actually manage — a CEO who rethinks the product, an eng manager who locks the architecture, a designer who catches AI slop, a paranoid reviewer who finds production bugs, a QA lead who opens a real browser and clicks through your app, and a release engineer who ships the PR. Thirteen specialists, all as slash commands, all Markdown, **all free, MIT license, available right now.**
 
-You:   /plan-eng-review
+I am learning how to get to the edge of what agentic systems can do as of March 2026, and this is my live experiment. I am sharing it because I want the whole world on this journey with me.
 
-Claude: [Architecture diagram, state machine for upload → classify → enrich
-        → draft pipeline, async job boundaries, failure modes, test matrix]
+Fork it. Improve it. Make it yours. Don't player hate, appreciate.
 
-You:   [exit plan mode, implement the plan]
+---
 
-You:   /review
+## See it work
 
-Claude: Race condition: two tabs can overwrite cover-photo selection.
-        Trust boundary: pulling web data into draft generation creates
-        a prompt injection vector. Missing: orphan cleanup for failed uploads.
+```
+You:    I want to add photo upload for sellers.
+You:    /plan-ceo-review
+Claude: "Photo upload" is not the feature. The real job is helping
+        sellers create listings that actually sell. What if we
+        auto-identify the product, pull specs and comps from the
+        web, and draft the listing automatically? That's 10 stars.
+        "Upload a photo" is 3 stars. Which are we building?
+        [8 expansion proposals, you cherry-pick 5, defer 3 to backlog]
 
-You:   (fix the issues)
+You:    /plan-design-review
+Claude: Design Score: B  |  AI Slop Score: C
+        "Upload flow looks like a default Bootstrap form."
+        [80-item audit, infers your design system, exports DESIGN.md]
+        [flags 3 AI slop patterns: gradient hero, icon grid, uniform radius]
 
-You:   /ship
+You:    /plan-eng-review
+Claude: ┌─────────┐    ┌──────────┐    ┌──────────┐    ┌─────────┐
+        │ Upload  │───▶│ Classify │───▶│ Enrich   │───▶│ Draft   │
+        │ (sync)  │    │ (async)  │    │ (async)  │    │ (async) │
+        └─────────┘    └──────────┘    └──────────┘    └─────────┘
+        [ASCII diagrams for every data flow, state machine, error path]
+        [14-case test matrix, 6 failure modes mapped, 3 security concerns]
 
-Claude: [Syncs main, runs tests, pushes branch, opens PR — 6 tool calls, done]
+You:    Approve plan. Exit plan mode.
+        [Claude writes 2,400 lines across 11 files — models, services,
+         controllers, views, migrations, and tests. ~8 minutes.]
 
-You:   /qa
+You:    /review
+Claude: [AUTO-FIXED] Orphan S3 cleanup on failed upload
+        [AUTO-FIXED] Missing index on listings.status
+        [ASK] Race condition on hero image selection → You: yes
+        [traces every new enum value through all switch statements]
+        3 issues — 2 auto-fixed, 1 fixed.
 
-Claude: Analyzing branch diff... 8 files changed, 3 routes affected.
-        [Tests /listings/new, /listings/:id, /api/listings against localhost:3000]
-        All 3 routes working. Upload + enrichment flow passes end to end.
+You:    /qa https://staging.myapp.com
+Claude: [opens real browser, logs in, uploads photos, clicks through flows]
+        Upload → classify → enrich → draft: end to end ✓
+        Mobile: ✓  |  Slow connection: ✓  |  Bad image: ✓
+        [finds bug: preview doesn't clear on second upload — fixes it]
+        Regression test generated.
 
-You:   /setup-browser-cookies staging.myapp.com
+You:    /ship
+Claude: Tests: 42 → 51 (+9 new)
+        Coverage: 14/14 code paths (100%)
+        PR: github.com/you/app/pull/42
+```
 
-Claude: Imported 8 cookies for staging.myapp.com from Chrome.
+One feature. Seven commands. The agent reframed the product, ran an 80-item design audit, drew the architecture, wrote 2,400 lines of code, found a race condition I would have missed, auto-fixed two issues, opened a real browser to QA test, found and fixed a bug I didn't know about, wrote 9 tests, and generated a regression test. That is not a copilot. That is a team.
 
-You:   /qa https://staging.myapp.com --quick
+---
 
-Claude: [Smoke test: homepage + 5 pages, 30 seconds]
-        Health Score: 91/100. No critical issues. 1 medium: mobile nav overlap.
+## The team
 
-You:   /plan-design-review https://staging.myapp.com
+| Skill | Your specialist | What they do |
+|-------|----------------|--------------|
+| `/plan-ceo-review` | **CEO / Founder** | Rethink the problem. Find the 10-star product hiding inside the request. Four modes: Expansion, Selective Expansion, Hold Scope, Reduction. |
+| `/plan-eng-review` | **Eng Manager** | Lock in architecture, data flow, diagrams, edge cases, and tests. Forces hidden assumptions into the open. |
+| `/plan-design-review` | **Senior Designer** | 80-item design audit with letter grades. AI Slop detection. Infers your design system. Report only — never touches code. |
+| `/design-consultation` | **Design Partner** | Build a complete design system from scratch. Knows the landscape, proposes creative risks, generates realistic product mockups. Design at the heart of all other phases. |
+| `/review` | **Staff Engineer** | Find the bugs that pass CI but blow up in production. Auto-fixes the obvious ones. Flags completeness gaps. |
+| `/ship` | **Release Engineer** | Sync main, run tests, audit coverage, push, open PR. Bootstraps test frameworks if you don't have one. One command. |
+| `/browse` | **QA Engineer** | Give the agent eyes. Real Chromium browser, real clicks, real screenshots. ~100ms per command. |
+| `/qa` | **QA Lead** | Test your app, find bugs, fix them with atomic commits, re-verify. Auto-generates regression tests for every fix. |
+| `/qa-only` | **QA Reporter** | Same methodology as /qa but report only. Use when you want a pure bug report without code changes. |
+| `/qa-design-review` | **Designer Who Codes** | Same audit as /plan-design-review, then fixes what it finds. Atomic commits, before/after screenshots. |
+| `/setup-browser-cookies` | **Session Manager** | Import cookies from your real browser (Chrome, Arc, Brave, Edge) into the headless session. Test authenticated pages. |
+| `/retro` | **Eng Manager** | Team-aware weekly retro. Per-person breakdowns, shipping streaks, test health trends, growth opportunities. |
+| `/document-release` | **Technical Writer** | Update all project docs to match what you just shipped. Catches stale READMEs automatically. |
 
-Claude: Design Score: B  |  AI Slop Score: C
+**[Deep dives with examples and philosophy for every skill →](docs/skills.md)**
 
-        "The site communicates competence but not confidence."
-        "I notice the spacing between sections is uniform — nothing feels important."
-        "The first 3 things my eye goes to are: the gradient hero, a 3-column
-         feature grid with icons in circles, and a cookie-cutter CTA."
-        "If I had to describe this in one word: template."
+---
 
-        Top issues: generic typography (Inter everywhere), AI slop patterns
-        (3-column icon grid, purple gradient), flat heading scale.
+## What's new and why it matters
 
-        [Full report with letter grades, 12 findings, inferred design system]
-        Want me to save this as your DESIGN.md?
+**Design is at the heart.** `/design-consultation` doesn't just pick fonts. It researches what's out there in your space, proposes safe choices AND creative risks, generates realistic mockups of your actual product, and writes `DESIGN.md` — and then `/qa-design-review` and `/plan-eng-review` read what you chose. Design decisions flow through the whole system.
 
-You:   /qa-design-review
+**`/qa` was a massive unlock.** It let me go from 6 to 12 parallel workers. Claude Code saying *"I SEE THE ISSUE"* and then actually fixing it, generating a regression test, and verifying the fix — that changed how I work. The agent has eyes now.
 
-Claude: [Runs the same audit, then fixes 8 design issues]
-        style(design): FINDING-001 — replace Inter with system font stack
-        style(design): FINDING-003 — add heading scale contrast
-        style(design): FINDING-007 — break 3-column grid into asymmetric layout
-        Design Score: B → A-  |  AI Slop Score: C → A
-```
+**Smart review routing.** Just like at a well-run startup: the CEO doesn't have to look at infra bug fixes, and design review isn't needed for backend changes. gstack tracks which reviews have been run, figures out what's appropriate, and just does the smart thing. The Review Readiness Dashboard tells you where you stand before you ship.
 
-## Who this is for
+**Test everything.** `/ship` bootstraps test frameworks from scratch if your project doesn't have one. Every `/ship` run produces a coverage audit. Every `/qa` bug fix generates a regression test. 100% test coverage is the goal — tests make vibe coding safe instead of yolo coding.
 
-You already use Claude Code heavily and want consistent, high-rigor workflows instead of one mushy generic mode. You want to tell the model what kind of brain to use right now — founder taste, engineering rigor, paranoid review, or fast execution.
+**`/document-release` is the engineer you never had.** It reads every doc file in your project, cross-references the diff, and updates everything that drifted. README, ARCHITECTURE, CONTRIBUTING, CLAUDE.md, TODOS — all kept current automatically.
 
-This is not a prompt pack for beginners. It is an operating system for people who ship.
+---
 
-## How to fly: 10 sessions at once
+## 10 sessions at once
 
-gstack is powerful with one Claude Code session. It is transformative with ten.
+gstack is powerful with one session. It is transformative with ten.
 
-[Conductor](https://conductor.build) runs multiple Claude Code sessions in parallel — each in its own isolated workspace. That means you can have one session running `/qa` on staging, another doing `/review` on a PR, a third implementing a feature, and seven more working on other branches. All at the same time.
+[Conductor](https://conductor.build) runs multiple Claude Code sessions in parallel — each in its own isolated workspace. One session running `/qa` on staging, another doing `/review` on a PR, a third implementing a feature, and seven more on other branches. All at the same time.
 
-Each workspace gets its own isolated browser instance automatically — separate Chromium process, cookies, tabs, and logs stored in `.gstack/` inside each project root. No port collisions, no shared state, no configuration needed. `/browse` and `/qa` sessions never interfere with each other, even across ten parallel workspaces.
+One person, ten parallel agents, each with the right cognitive mode. That is a different way of building software.
 
-This is the setup I use. One person, ten parallel agents, each with the right cognitive mode for its task. That is not incremental improvement. That is a different way of building software.
+---
 
-## Install
+## Install — takes 30 seconds
 
-**Requirements:** [Claude Code](https://docs.anthropic.com/en/docs/claude-code), [Git](https://git-scm.com/), [Bun](https://bun.sh/) v1.0+. `/browse` compiles a native binary — works on macOS and Linux (x64 and arm64).
+**Requirements:** [Claude Code](https://docs.anthropic.com/en/docs/claude-code), [Git](https://git-scm.com/), [Bun](https://bun.sh/) v1.0+
 
 ### Step 1: Install on your machine
 
-Open Claude Code and paste this. Claude will do the rest.
+Open Claude Code and paste this. Claude does the rest.
 
 > Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
 
@@ -138,25 +138,14 @@ Open Claude Code and paste this. Claude will do the rest.
 
 > Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
 
-Real files get committed to your repo (not a submodule), so `git clone` just works. The binary and node\_modules are gitignored — teammates just need to run `cd .claude/skills/gstack && ./setup` once to build (or `/browse` handles it automatically on first use).
-
-### What gets installed
-
-- Skill files (Markdown prompts) in `~/.claude/skills/gstack/` (or `.claude/skills/gstack/` for project installs)
-- Symlinks at `~/.claude/skills/browse`, `~/.claude/skills/qa`, `~/.claude/skills/review`, etc. pointing into the gstack directory
-- Browser binary at `browse/dist/browse` (~58MB, gitignored)
-- `node_modules/` (gitignored)
-- `/retro` saves JSON snapshots to `.context/retros/` in your project for trend tracking
-
-Everything lives inside `.claude/`. Nothing touches your PATH or runs in the background.
+Real files get committed to your repo (not a submodule), so `git clone` just works. Everything lives inside `.claude/`. Nothing touches your PATH or runs in the background.
 
 ---
 
 ```
 +----------------------------------------------------------------------------+
 |                                                                            |
-|   Are you a great software engineer who loves to write 10K LOC/day         |
-|   and land 10 PRs a day like Garry?                                        |
+|   Are you a great software engineer who wants to ship 10K+ LOC/day?        |
 |                                                                            |
 |   Come work at YC: ycombinator.com/software                                |
 |                                                                            |
@@ -169,694 +158,36 @@ Everything lives inside `.claude/`. Nothing touches your PATH or runs in the bac
 
 ---
 
-## How I use these skills
+## Come ride the wave
 
-Created by [Garry Tan](https://x.com/garrytan), President & CEO of [Y Combinator](https://www.ycombinator.com/).
+This is **free, MIT licensed, open source, available now.** No premium tier. No waitlist. No strings.
 
-I built gstack because I do not want AI coding tools stuck in one mushy mode.
+I open sourced how I do development and I am actively upgrading my own software factory here. You can fork it and make it your own. That's the whole point. I want everyone on this journey.
 
-Planning is not review. Review is not shipping. Founder taste is not engineering rigor. If you blur all of that together, you usually get a mediocre blend of all four.
+The models are getting better fast. The people who figure out how to work with them now — really work with them, not just dabble — are going to have a massive advantage. This is that window. Let's go.
 
-I want explicit gears.
-
-These skills let me tell the model what kind of brain I want right now. I can switch cognitive modes on demand — founder, eng manager, paranoid reviewer, release machine. That is the unlock.
+**[github.com/garrytan/gstack](https://github.com/garrytan/gstack)** — MIT License
 
 ---
 
-## `/plan-ceo-review`
-
-This is my **founder mode**.
-
-This is where I want the model to think with taste, ambition, user empathy, and a long time horizon. I do not want it taking the request literally. I want it asking a more important question first:
-
-**What is this product actually for?**
-
-I think of this as **Brian Chesky mode**.
-
-The point is not to implement the obvious ticket. The point is to rethink the problem from the user's point of view and find the version that feels inevitable, delightful, and maybe even a little magical.
-
-### Example
-
-Say I am building a Craigslist-style listing app and I say:
-
-> "Let sellers upload a photo for their item."
-
-A weak assistant will add a file picker and save an image.
-
-That is not the real product.
-
-In `/plan-ceo-review`, I want the model to ask whether "photo upload" is even the feature. Maybe the real feature is helping someone create a listing that actually sells.
-
-If that is the real job, the whole plan changes.
-
-Now the model should ask:
-
-* Can we identify the product from the photo?
-* Can we infer the SKU or model number?
-* Can we search the web and draft the title and description automatically?
-* Can we pull specs, category, and pricing comps?
-* Can we suggest which photo will convert best as the hero image?
-* Can we detect when the uploaded photo is ugly, dark, cluttered, or low-trust?
-* Can we make the experience feel premium instead of like a dead form from 2007?
-
-That is what `/plan-ceo-review` does for me.
-
-It does not just ask, "how do I add this feature?"
-It asks, **"what is the 10-star product hiding inside this request?"**
-
-That is a very different kind of power.
-
----
-
-## `/plan-eng-review`
-
-This is my **eng manager mode**.
-
-Once the product direction is right, I want a different kind of intelligence entirely. I do not want more sprawling ideation. I do not want more "wouldn't it be cool if." I want the model to become my best technical lead.
-
-This mode should nail:
-
-* architecture
-* system boundaries
-* data flow
-* state transitions
-* failure modes
-* edge cases
-* trust boundaries
-* test coverage
-
-And one surprisingly big unlock for me: **diagrams**.
-
-LLMs get way more complete when you force them to draw the system. Sequence diagrams, state diagrams, component diagrams, data-flow diagrams, even test matrices. Diagrams force hidden assumptions into the open. They make hand-wavy planning much harder.
-
-So `/plan-eng-review` is where I want the model to build the technical spine that can carry the product vision.
-
-### Example
-
-Take the same listing app example.
-
-Let's say `/plan-ceo-review` already did its job. We decided the real feature is not just photo upload. It is a smart listing flow that:
-
-* uploads photos
-* identifies the product
-* enriches the listing from the web
-* drafts a strong title and description
-* suggests the best hero image
-
-Now `/plan-eng-review` takes over.
-
-Now I want the model to answer questions like:
-
-* What is the architecture for upload, classification, enrichment, and draft generation?
-* Which steps happen synchronously, and which go to background jobs?
-* Where are the boundaries between app server, object storage, vision model, search/enrichment APIs, and the listing database?
-* What happens if upload succeeds but enrichment fails?
-* What happens if product identification is low-confidence?
-* How do retries work?
-* How do we prevent duplicate jobs?
-* What gets persisted when, and what can be safely recomputed?
-
-And this is where I want diagrams — architecture diagrams, state models, data-flow diagrams, test matrices. Diagrams force hidden assumptions into the open. They make hand-wavy planning much harder.
-
-That is `/plan-eng-review`.
-
-Not "make the idea smaller."
-**Make the idea buildable.**
-
----
-
-## `/plan-design-review`
-
-This is my **senior designer mode**.
-
-Most developers cannot tell whether their site looks AI-generated. I could not, until I started paying attention. There is a growing class of sites that are functional but soulless — they work fine but scream "an AI built this and nobody with taste looked at it." Purple gradients, 3-column icon grids, uniform bubbly border-radius on everything, centered text on every section, decorative blobs floating in the background. The ChatGPT aesthetic.
-
-`/plan-design-review` gives the agent a designer's eye.
-
-It opens your site and reacts to it the way a Stripe or Linear designer would — immediately, viscerally, with opinions. The first output is a structured gut reaction: what the site communicates at a glance, what the eye is drawn to, and a one-word verdict. That is the most valuable part. Everything after is supporting evidence.
-
-Then it extracts your actual design system by reading the CSS: how many fonts are you really using? What is your heading scale? How many colors? Is your spacing on a grid or arbitrary? It structures this as an **Inferred Design System** and offers to save it as a `DESIGN.md` — so now you have a design system you never had before, derived from what you actually shipped.
-
-The audit covers 80 items across 10 categories. Typography, spacing, hierarchy, color, responsive design, interaction states, motion, content quality, performance feel, and — the headline feature — **AI Slop Detection**. Ten specific anti-patterns that mark a site as machine-generated.
-
-Every finding gets a letter grade (A through F) per category. The report opens with two headline scores: **Design Score** and **AI Slop Score**. "Your site got a B on design but a D on AI Slop" tells you exactly where to focus.
-
-### Example
-
-```
-You:   /plan-design-review https://myapp.com
-
-Claude: Design Score: C  |  AI Slop Score: D
-
-        "The site communicates generic SaaS energy."
-        "I notice the hero section uses a blue-to-purple gradient
-         with a 3-column feature grid below it — the single most
-         recognizable AI-generated layout pattern."
-        "The first 3 things my eye goes to are: the gradient, the
-         symmetrical icon grid, and a 'Get Started' button that
-         looks like every other 'Get Started' button."
-        "If I had to describe this in one word: template."
-
-        Inferred Design System:
-        - Fonts: Inter (body), Inter (headings) — 1 font family
-        - Colors: 14 unique non-gray colors (flag: >12)
-        - Heading scale: 36/24/18/16 — flat, no drama between sizes
-        - Spacing: mostly 16px and 24px — no rhythm
-
-        Top 5 Design Improvements:
-        1. Break the 3-column icon grid (High, AI Slop)
-        2. Add heading scale contrast — at least 2:1 ratio (High, Typography)
-        3. Replace uniform border-radius with intentional hierarchy (Medium, Spacing)
-        4. Kill the gradient hero — use a real image or bold typography (High, AI Slop)
-        5. Add a second font for headings — Inter-only reads as generic (Medium, Typography)
-
-        [Full report saved to .gstack/design-reports/]
-        Want me to save this inferred design system as your DESIGN.md?
-```
-
-This is report only — it never touches your code. Use `/qa-design-review` when you want it to fix what it finds.
-
----
-
-## `/design-consultation`
-
-This is my **design partner mode**.
-
-`/plan-design-review` audits a site that already exists. `/design-consultation` is for when you have nothing yet — no design system, no font choices, no color palette. You are starting from zero and you want a senior designer to sit down with you and build the whole visual identity together.
-
-It is a conversation, not a form. The agent asks about your product, your users, and your audience. It thinks about what your product needs to communicate — trust, speed, craft, warmth, whatever fits — and works backward from that to concrete choices. Then it proposes a complete, coherent design system: aesthetic direction, typography (3+ fonts with specific roles), color palette with hex values, spacing scale, layout approach, and motion strategy. Every recommendation comes with a rationale. Every choice reinforces every other choice.
-
-But coherence is table stakes. Every dev tool dashboard looks the same — clean sans-serif, muted grays, a blue accent. They are all coherent. They are all forgettable. The difference between a product that looks "nice" and one that people actually recognize is the **deliberate creative risks**: the unexpected serif for headings, the bold accent nobody else in your category uses, the tighter spacing that makes your data feel authoritative instead of airy.
-
-That is what `/design-consultation` is really about. It does not just propose a safe system. It proposes safe choices AND risks — and tells you which is which. "Here are the choices that keep you literate in your category. And here is where I think you should break from convention, and why." You pick which risks to take. The agent checks that the whole system still coheres either way.
-
-If you want, the agent will browse your competitors' actual sites — take screenshots, analyze their fonts and colors and spacing — so you can see the landscape before you make choices. This is not about copying. It is about getting in the ballpark so you know what the conventions are, and then deciding which ones are worth breaking.
-
-After you agree on the system, it generates an interactive HTML preview page — not just swatches and font samples, but realistic product pages. If you are building a dashboard, you see a dashboard with a sidebar, data tables, and stat cards. If you are building a marketing site, you see a hero section with real copy and a CTA. Everything rendered in your design system, with your product name, in light and dark mode. You see what your product could feel like before a single line of production code is written.
-
-Then it writes `DESIGN.md` to your repo root — your project's design source of truth — and updates `CLAUDE.md` so every future Claude Code session respects the system. From that point on, `/qa-design-review` can audit against it, and any agent working on your frontend knows the rules.
-
-```
-You:   /design-consultation
-
-Claude: From the README, this looks like a developer analytics dashboard
-        for engineering teams. Sound right? Tell me about the feeling
-        you want — and would you like me to browse some competitors
-        first so we can see the landscape?
-
-You:    Yes, it's for eng managers. Show me what's out there.
-
-Claude: [browses Linear, Vercel, Datadog, Posthog — takes screenshots]
-
-        Here's the landscape. They all converge on clean sans-serifs
-        and muted blue-gray palettes. Linear stands out with dark-first
-        and tight spacing. The rest feel interchangeable.
-
-        Here's my proposal — and where I'd play it safe vs. take risks:
-
-        AESTHETIC: Industrial/Utilitarian — data-first, every pixel earns its place
-        TYPOGRAPHY: Geist (body + UI), Instrument Serif (display), JetBrains Mono (data)
-        COLOR: Restrained — slate neutrals, single teal accent (#0D9488)
-        SPACING: 4px base, compact density
-        LAYOUT: Grid-disciplined, 12-column
-        MOTION: Minimal-functional — only transitions that aid comprehension
-
-        SAFE CHOICES (match category expectations):
-          Geist for body — your users already know this font from Vercel
-          Slate neutrals — warm grays feel right for data-heavy UIs
-          Grid-disciplined layout — dashboards need predictable alignment
-
-        RISKS (where you'd stand out):
-          Instrument Serif for display headings — nobody in dev tools
-            uses a serif. It creates instant hierarchy contrast and
-            signals "we care about craft" in a space full of sans-serifs.
-          Single teal accent instead of blue — every competitor uses blue.
-            Teal is close enough to feel trustworthy, different enough
-            to be recognizable.
-          4px compact density — tighter than Linear, says "we respect
-            your screen real estate."
-
-        The safe choices keep you literate. The risks are where your
-        product gets its own face. Which risks appeal to you?
-
-You:    Love the serif risk. Let's see it.
-
-Claude: Preview opened in your browser.
-        [/tmp/design-consultation-preview-1710000000.html]
-
-        The page shows a realistic dashboard: sidebar nav, header with
-        avatar, stat cards, data table — all in your design system.
-        Instrument Serif at hero scale, Geist in body text, JetBrains
-        Mono in the data table. Teal accent on buttons and active states.
-        Light and dark mode toggle in the corner.
-
-        How does it feel? Want to adjust anything before I write DESIGN.md?
-
-You:    Ship it.
-
-Claude: Wrote DESIGN.md (typography, color, spacing, layout, motion).
-        Updated CLAUDE.md with design system guidelines.
-        All future sessions will respect these choices.
-```
-
----
-
-## `/qa-design-review`
-
-This is my **designer who codes mode**.
-
-`/plan-design-review` tells you what is wrong. `/qa-design-review` fixes it.
-
-It runs the same 80-item audit, then enters a fix loop: for each design finding, it locates the source file, makes the minimal CSS/styling change, commits with `style(design): FINDING-NNN`, re-navigates to verify, and takes before/after screenshots. One commit per fix, fully bisectable.
-
-The self-regulation heuristic is tuned for design work — CSS-only changes get a free pass (they are inherently safe and reversible), but changes to component JSX/TSX files count against the risk budget. Hard cap at 30 fixes. If the risk score exceeds 20%, it stops and asks.
-
-```
-You:   /qa-design-review https://myapp.com
-
-Claude: [Runs full design audit — same output as /plan-design-review]
-        Design Score: C  |  AI Slop Score: D
-        12 findings (4 high, 5 medium, 3 polish)
-
-        Fixing 9 design issues...
-
-        style(design): FINDING-001 — replace 3-column icon grid with asymmetric layout
-        style(design): FINDING-002 — add heading scale 48/32/24/18/16
-        style(design): FINDING-003 — remove gradient hero, use bold typography
-        style(design): FINDING-004 — add second font for headings
-        style(design): FINDING-005 — vary border-radius by element role
-        style(design): FINDING-006 — left-align body text, reserve center for headings
-        style(design): FINDING-007 — add hover/focus states to all interactive elements
-        style(design): FINDING-008 — add prefers-reduced-motion media query
-        style(design): FINDING-009 — set max content width to 680px for body text
-
-        Final audit:
-        Design Score: C → B+  |  AI Slop Score: D → A
-        9 fixes applied (8 verified, 1 best-effort). 3 deferred.
-
-        [Report with before/after screenshots saved to .gstack/design-reports/]
-```
-
-Nine commits, each touching one concern. The AI Slop score went from D to A because the three most recognizable patterns (gradient hero, 3-column grid, uniform radius) are gone. The design score improved two grades because the typography now has a scale, the spacing has hierarchy, and interactive elements have proper states.
-
----
-
-## `/review`
-
-This is my **paranoid staff engineer mode**.
-
-Passing tests do not mean the branch is safe.
-
-`/review` exists because there is a whole class of bugs that can survive CI and still punch you in the face in production. This mode is not about dreaming bigger. It is not about making the plan prettier. It is about asking:
-
-**What can still break?**
-
-This is a structural audit, not a style nitpick pass. I want the model to look for things like:
-
-* N+1 queries
-* stale reads
-* race conditions
-* bad trust boundaries
-* missing indexes
-* escaping bugs
-* broken invariants
-* bad retry logic
-* tests that pass while missing the real failure mode
-
-### Example
-
-Suppose the smart listing flow is implemented and the tests are green.
-
-`/review` should still ask:
-
-* Did I introduce an N+1 query when rendering listing photos or draft suggestions?
-* Am I trusting client-provided file metadata instead of validating the actual file?
-* Can two tabs race and overwrite cover-photo selection or item details?
-* Do failed uploads leave orphaned files in storage forever?
-* Can the "exactly one hero image" rule break under concurrency?
-* If enrichment APIs partially fail, do I degrade gracefully or save garbage?
-* Did I accidentally create a prompt injection or trust-boundary problem by pulling web data into draft generation?
-
-That is the point of `/review`.
-
-I do not want flattery here.
-I want the model imagining the production incident before it happens.
-
----
-
-## `/ship`
-
-This is my **release machine mode**.
-
-Once I have decided what to build, nailed the technical plan, and run a serious review, I do not want more talking. I want execution.
-
-`/ship` is for the final mile. It is for a ready branch, not for deciding what to build.
-
-This is where the model should stop behaving like a brainstorm partner and start behaving like a disciplined release engineer: sync with main, run the right tests, make sure the branch state is sane, update changelog or versioning if the repo expects it, push, and create or update the PR.
-
-Momentum matters here.
-
-A lot of branches die when the interesting work is done and only the boring release work is left. Humans procrastinate that part. AI should not.
-
-### Example
-
-Suppose the smart listing flow is finished.
-
-The product thinking is done.
-The architecture is done.
-The review pass is done.
-Now the branch just needs to get landed.
+## Docs
 
-That is what `/ship` is for.
-
-It takes care of the repetitive release hygiene so I do not bleed energy on:
-
-* syncing with main
-* rerunning tests
-* checking for weird branch state
-* updating changelog/version metadata
-* pushing the branch
-* opening or updating the PR
-
-At this point I do not want more ideation.
-I want the plane landed.
-
----
-
-## Greptile integration
-
-[Greptile](https://greptile.com) is a YC company that reviews your PRs automatically. It catches real bugs — race conditions, security issues, things that pass CI and blow up in production. It has genuinely saved my ass more than once. I love these guys.
-
-**Setup:** Install Greptile on your GitHub repo at [greptile.com](https://greptile.com) — it takes about 30 seconds. Once it's reviewing your PRs, gstack picks up its comments automatically. No additional configuration.
-
-The problem with any automated reviewer is triage. Greptile is good, but not every comment is a real issue. Some are false positives. Some flag things you already fixed three commits ago. Without a triage layer, the comments pile up and you start ignoring them — which defeats the purpose.
-
-gstack solves this. `/review` and `/ship` are now Greptile-aware. They read Greptile's comments, classify each one, and take action:
-
-- **Valid issues** get added to the critical findings and fixed before shipping
-- **Already-fixed issues** get an auto-reply acknowledging the catch
-- **False positives** get pushed back — you confirm, and a reply goes out explaining why it's wrong
-
-The result is a two-layer review: Greptile catches things asynchronously on the PR, then `/review` and `/ship` triage those findings as part of the normal workflow. Nothing falls through the cracks.
-
-It also learns. Every false positive you confirm gets saved to `~/.gstack/greptile-history.md`. Future runs auto-skip known FP patterns for your codebase. And `/retro` tracks Greptile's batting average over time — so you can see whether the signal-to-noise ratio is improving.
-
-### Example
-
-```
-You:   /ship
-
-Claude: [syncs main, runs tests, pre-landing review...]
-
-        Greptile found 3 comments on this PR:
-
-        [VALID] app/services/payment_service.rb:47 — Race condition:
-        concurrent charges can double-debit. Recommend DB-level advisory
-        lock around the charge block.
-        → https://github.com/you/app/pull/42#discussion_r123
-
-        [ALREADY FIXED] app/models/user.rb:12 — Missing null check
-        on email before downcase.
-        → Already fixed in commit abc1234. Auto-replying.
-
-        [FALSE POSITIVE] lib/auth.rb:88 — "Token comparison should
-        use constant-time comparison." We already use
-        ActiveSupport::SecurityUtils.secure_compare here.
-        → https://github.com/you/app/pull/42#discussion_r125
-
-        Fixing the race condition in payment_service.rb...
-        Applied advisory lock. Committed: fix: address Greptile
-        review — advisory lock on concurrent charges
-
-        The auth token comment is a false positive — we're already
-        using secure_compare.
-
-        Options for the false positive:
-          A) Reply to Greptile explaining (recommended)
-          B) Fix it anyway
-          C) Ignore
-
-You:    A
-
-Claude: Replied to Greptile. Re-running tests after the fix...
-        All tests pass. Continuing to version bump.
-
-        [creates PR with Greptile Review section in body]
-        PR: https://github.com/you/app/pull/42
-```
-
-Three Greptile comments. One real fix. One auto-acknowledged. One false positive pushed back with a reply. Total extra time: about 30 seconds. And the PR body has the full audit trail.
-
----
-
-## `/browse`
-
-This is my **QA engineer mode**.
-
-`/browse` is the skill that closes the loop. Before it, the agent could think and code but was still half blind. It had to guess about UI state, auth flows, redirects, console errors, empty states, and broken layouts. Now it can just go look.
-
-That is a real step-change. The full cycle becomes: plan, code, run the app, inspect the UI, reproduce the bug, verify the fix, ship. QA stops being "go click around manually" and becomes part of the same agentic loop. It gives the agent eyes. Now it can do the boring, high-context QA work itself: click through the app, catch breakage, verify the fix, and keep going. That feels like having a real operator in the machine.
-
-It is a compiled binary that talks to a persistent Chromium daemon — built on [Playwright](https://playwright.dev/) by Microsoft. First call starts the browser (~3s). Every call after that: ~100-200ms. The browser stays running between commands, so cookies, tabs, and localStorage carry over.
-
-After I push a branch, I tell Claude to go check staging. It does the entire QA pass for me:
-
-```
-You:   /browse staging.myapp.com — log in, test the signup flow, and check
-       every page I changed in this branch
-
-Claude: [18 tool calls, ~60 seconds]
-
-        > browse goto https://staging.myapp.com/signup
-        > browse snapshot -i
-        > browse fill @e2 "test@example.com"
-        > browse fill @e3 "password123"
-        > browse click @e5                    (Submit)
-        > browse screenshot /tmp/signup.png
-        > Read /tmp/signup.png
-
-        Signup works. Redirected to onboarding. Now checking changed pages.
-
-        > browse goto https://staging.myapp.com/dashboard
-        > browse screenshot /tmp/dashboard.png
-        > Read /tmp/dashboard.png
-        > browse console
-
-        Dashboard loads. No console errors. Charts render with sample data.
-
-        > browse goto https://staging.myapp.com/settings/billing
-        > browse screenshot /tmp/billing.png
-        > Read /tmp/billing.png
-
-        Billing page loads. Plan selector shows Free/Pro/Enterprise.
-        Stripe elements render correctly.
-
-        > browse goto https://staging.myapp.com/api/health
-        > browse text
-
-        API health endpoint returns {"status":"ok","version":"2.4.1"}.
-
-        All 4 pages load correctly. No console errors. No broken layouts.
-        Signup → onboarding → dashboard flow works end to end.
-```
-
-18 tool calls, about a minute. It signed up a test user, navigated every page I changed, took screenshots, read them, checked the console for errors, and verified the API. That is a full QA pass. I did not open a browser.
-
-It works for reading documentation, verifying deployments, filling out forms, taking screenshots, comparing pages across environments, and anything else where Claude needs eyes on a live URL.
-
-**Security note:** `/browse` runs a persistent Chromium session. Cookies, localStorage, and session state carry over between commands. Do not use it against sensitive production environments unless you intend to — it is a real browser with real state. The session auto-shuts down after 30 minutes of idle time.
-
-For the full command reference, technical internals, and architecture details, see [BROWSER.md](BROWSER.md).
-
----
-
-## `/qa`
-
-This is my **QA lead mode**.
-
-`/browse` gives the agent eyes. `/qa` gives it a testing methodology.
-
-The most common use case: you're on a feature branch, you just finished coding, and you want to verify everything works. Just say `/qa` — it reads your git diff, identifies which pages and routes your changes affect, spins up the browser, and tests each one. No URL required. No manual test plan. It figures out what to test from the code you changed.
-
-```
-You:   /qa
-
-Claude: Analyzing branch diff against main...
-        12 files changed: 3 controllers, 2 views, 4 services, 3 tests
-
-        Affected routes: /listings/new, /listings/:id, /api/listings
-        Detected app running on localhost:3000.
-
-        [Tests each affected page — navigates, fills forms, clicks buttons,
-        screenshots, checks console errors]
-
-        QA Report: 3 routes tested, all working.
-        - /listings/new: upload + enrichment flow works end to end
-        - /listings/:id: detail page renders correctly
-        - /api/listings: returns 200 with expected shape
-        No console errors. No regressions on adjacent pages.
-```
-
-Four modes:
-
-- **Diff-aware** (automatic on feature branches) — reads `git diff main`, identifies affected pages, tests them specifically. The fastest path from "I just wrote code" to "it works."
-- **Full** — systematic exploration of the entire app. 5-15 minutes depending on app size. Documents 5-10 well-evidenced issues.
-- **Quick** (`--quick`) — 30-second smoke test. Homepage + top 5 nav targets. Loads? Console errors? Broken links?
-- **Regression** (`--regression baseline.json`) — run full mode, then diff against a previous baseline. Which issues are fixed? Which are new? What's the score delta?
-
-```
-You:   /qa https://staging.myapp.com
-
-Claude: [Explores 12 pages, fills 3 forms, tests 2 flows]
-
-        QA Report: staging.myapp.com — Health Score: 72/100
-
-        Top 3 Issues:
-        1. CRITICAL: Checkout form submits with empty required fields
-        2. HIGH: Mobile nav menu doesn't close after selecting an item
-        3. MEDIUM: Dashboard chart overlaps sidebar below 1024px
-
-        [Full report with screenshots saved to .gstack/qa-reports/]
-```
-
-Reports and screenshots accumulate in `.gstack/qa-reports/` so you can track quality over time and compare runs.
-
-**Testing authenticated pages:** Use `/setup-browser-cookies` first to import your real browser sessions, then `/qa` can test pages behind login.
-
----
-
-## `/setup-browser-cookies`
-
-This is my **session manager mode**.
-
-Before `/qa` or `/browse` can test authenticated pages, they need cookies. Instead of manually logging in through the headless browser every time, `/setup-browser-cookies` imports your real sessions directly from your daily browser.
-
-It auto-detects installed Chromium browsers (Comet, Chrome, Arc, Brave, Edge), decrypts cookies via the macOS Keychain, and loads them into the Playwright session. An interactive picker UI lets you choose exactly which domains to import — no cookie values are ever displayed.
-
-```
-You:   /setup-browser-cookies
-
-Claude: Cookie picker opened — select the domains you want to import
-        in your browser, then tell me when you're done.
-
-        [You pick github.com, myapp.com in the browser UI]
-
-You:    done
-
-Claude: Imported 2 domains (47 cookies). Session is ready.
-```
-
-Or skip the UI entirely:
-
-```
-You:   /setup-browser-cookies github.com
-
-Claude: Imported 12 cookies for github.com from Comet.
-```
-
-First import per browser triggers a macOS Keychain prompt — click "Allow" or "Always Allow."
-
----
-
-## `/retro`
-
-This is my **engineering manager mode**.
-
-At the end of the week I want to know what actually happened. Not vibes — data. `/retro` analyzes commit history, work patterns, and shipping velocity and writes a candid retrospective.
-
-It is team-aware. It identifies who is running the command, gives you the deepest treatment on your own work, then breaks down every contributor with specific praise and growth opportunities — the kind of feedback you would actually give in a 1:1. It computes metrics like commits, LOC, test ratio, PR sizes, and fix ratio. It detects coding sessions from commit timestamps, finds hotspot files, tracks shipping streaks, and identifies the biggest ship of the week.
-
-```
-You:   /retro
-
-Claude: Week of Mar 1: 47 commits (3 contributors), 3.2k LOC, 38% tests, 12 PRs, peak: 10pm | Streak: 47d
-
-        ## Your Week
-        32 commits, +2.4k LOC, 41% tests. Peak hours: 9-11pm.
-        Biggest ship: cookie import system (browser decryption + picker UI).
-        What you did well: shipped a complete feature with encryption, UI, and
-        18 unit tests in one focused push...
-
-        ## Team Breakdown
-
-        ### Alice
-        12 commits focused on app/services/. Every PR under 200 LOC — disciplined.
-        Opportunity: test ratio at 12% — worth investing before payment gets more complex.
-
-        ### Bob
-        3 commits — fixed the N+1 query on dashboard. Small but high-impact.
-        Opportunity: only 1 active day this week — check if blocked on anything.
-
-        [Top 3 team wins, 3 things to improve, 3 habits for next week]
-```
-
-It saves a JSON snapshot to `.context/retros/` so the next run can show trends. Run `/retro compare` to see this week vs last week side by side.
-
----
-
-## `/document-release`
-
-This is my **technical writer mode**.
-
-After `/ship` creates the PR but before it merges, `/document-release` reads every documentation file in the project and cross-references it against the diff. It updates file paths, command lists, project structure trees, and anything else that drifted. Risky or subjective changes get surfaced as questions — everything else is handled automatically.
-
-```
-You:   /document-release
-
-Claude: Analyzing 21 files changed across 3 commits. Found 8 documentation files.
-
-        README.md: updated skill count from 9 to 10, added new skill to table
-        CLAUDE.md: added new directory to project structure
-        CONTRIBUTING.md: current — no changes needed
-        TODOS.md: marked 2 items complete, added 1 new item
-
-        All docs updated and committed. PR body updated with doc diff.
-```
-
-It also polishes CHANGELOG voice (without ever overwriting entries), cleans up completed TODOS, checks cross-doc consistency, and asks about VERSION bumps only when appropriate.
-
----
+| Doc | What it covers |
+|-----|---------------|
+| [Skill Deep Dives](docs/skills.md) | Philosophy, examples, and workflow for every skill (includes Greptile integration) |
+| [Architecture](ARCHITECTURE.md) | Design decisions and system internals |
+| [Browser Reference](BROWSER.md) | Full command reference for `/browse` |
+| [Contributing](CONTRIBUTING.md) | Dev setup, testing, contributor mode, and dev mode |
+| [Changelog](CHANGELOG.md) | What's new in every version |
 
 ## Troubleshooting
 
-**Skill not showing up in Claude Code?**
-Run `cd ~/.claude/skills/gstack && ./setup` (or `cd .claude/skills/gstack && ./setup` for project installs). This rebuilds symlinks so Claude can discover the skills.
-
-**`/browse` fails or binary not found?**
-Run `cd ~/.claude/skills/gstack && bun install && bun run build`. This compiles the browser binary. Requires Bun v1.0+.
-
-**Project copy is stale?**
-Run `/gstack-upgrade` — it updates both the global install and any vendored project copy automatically.
-
-**`bun` not installed?**
-Install it: `curl -fsSL https://bun.sh/install | bash`
-
-## Upgrading
-
-Run `/gstack-upgrade` in Claude Code. It detects your install type (global or vendored), upgrades, syncs any project copies, and shows what's new.
+**Skill not showing up?** `cd ~/.claude/skills/gstack && ./setup`
 
-Or set `auto_upgrade: true` in `~/.gstack/config.yaml` to upgrade automatically whenever a new version is available.
-
-## Uninstalling
-
-Paste this into Claude Code:
-
-> Uninstall gstack: remove the skill symlinks by running `for s in browse plan-ceo-review plan-eng-review plan-design-review design-consultation review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f ~/.claude/skills/$s; done` then run `rm -rf ~/.claude/skills/gstack` and remove the gstack section from CLAUDE.md. If this project also has gstack at .claude/skills/gstack, remove it by running `for s in browse plan-ceo-review plan-eng-review plan-design-review review ship retro qa qa-only qa-design-review setup-browser-cookies document-release; do rm -f .claude/skills/$s; done && rm -rf .claude/skills/gstack` and remove the gstack section from the project CLAUDE.md too.
-
-## Development
-
-See [CONTRIBUTING.md](CONTRIBUTING.md) for setup, testing, and dev mode. See [ARCHITECTURE.md](ARCHITECTURE.md) for design decisions and system internals. See [BROWSER.md](BROWSER.md) for the browse command reference.
-
-### Testing
-
-```bash
-bun test                     # free static tests (<5s)
-EVALS=1 bun run test:evals   # full E2E + LLM evals (~$4, ~20min)
-bun run eval:watch            # live dashboard during E2E runs
-```
+**`/browse` fails?** `cd ~/.claude/skills/gstack && bun install && bun run build`
 
-E2E tests stream real-time progress, write machine-readable diagnostics, and persist partial results that survive kills. See CONTRIBUTING.md for the full eval infrastructure.
+**Stale install?** Run `/gstack-upgrade` — or set `auto_upgrade: true` in `~/.gstack/config.yaml`
 
 ## License
 
-MIT
+MIT. Free forever. Go build something.
diff --git a/SKILL.md b/SKILL.md
index c0d6e267..72bdb682 100644
--- a/SKILL.md
+++ b/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/TODOS.md b/TODOS.md
index a0801d85..8616f906 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -386,6 +386,16 @@
 **Priority:** P2
 **Depends on:** None
 
+### Cross-platform URL open helper
+
+**What:** `gstack-open-url` helper script — detect platform, use `open` (macOS) or `xdg-open` (Linux).
+
+**Why:** The first-time Completeness Principle intro uses macOS `open` to launch the essay. If gstack ever supports Linux, this silently fails.
+
+**Effort:** S (human: ~30 min / CC: ~2 min)
+**Priority:** P4
+**Depends on:** None
+
 ### CDP-based DOM mutation detection for ref staleness
 
 **What:** Use Chrome DevTools Protocol `DOM.documentUpdated` / MutationObserver events to proactively invalidate stale refs when the DOM changes, without requiring an explicit `snapshot` call.
@@ -458,6 +468,20 @@ Shipped as `/design-consultation` on garrytan/design branch. Renamed from `/setu
 **Priority:** P2
 **Depends on:** Ship Confidence Dashboard (shipped)
 
+## Completeness
+
+### Completeness metrics dashboard
+
+**What:** Track how often Claude chooses the complete option vs shortcut across gstack sessions. Aggregate into a dashboard showing completeness trend over time.
+
+**Why:** Without measurement, we can't know if the Completeness Principle is working. Could surface patterns (e.g., certain skills still bias toward shortcuts).
+
+**Context:** Would require logging choices (e.g., append to a JSONL file when AskUserQuestion resolves), parsing them, and displaying trends. Similar pattern to eval persistence.
+
+**Effort:** M (human) / S (CC)
+**Priority:** P3
+**Depends on:** Boil the Lake shipped (v0.6.1)
+
 ## Completed
 
 ### Phase 1: Foundations (v0.2.0)
diff --git a/VERSION b/VERSION
index 758efdb4..ee6cdce3 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.6.0.1
+0.6.1
diff --git a/browse/SKILL.md b/browse/SKILL.md
index 33accc09..50198d5f 100644
--- a/browse/SKILL.md
+++ b/browse/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/design-consultation/SKILL.md b/design-consultation/SKILL.md
index f04e2213..8fd9cb4b 100644
--- a/design-consultation/SKILL.md
+++ b/design-consultation/SKILL.md
@@ -2,7 +2,7 @@
 name: design-consultation
 version: 1.0.0
 description: |
-  Design consultation: understands your product, researches competitors, proposes a
+  Design consultation: understands your product, researches the landscape, proposes a
   complete design system (aesthetic, typography, color, layout, spacing, motion), and
   generates font+color preview pages. Creates DESIGN.md as your project's design source
   of truth. For existing sites, use /plan-design-review to infer the system instead.
@@ -31,22 +31,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
@@ -158,7 +197,7 @@ Ask the user a single question that covers everything you need to know. Pre-fill
 3. "Want me to research what top products in your space are doing for design, or should I work from my design knowledge?"
 4. **Explicitly say:** "At any point you can just drop into chat and we'll talk through anything — this isn't a rigid form, it's a conversation."
 
-If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research competitors, or should I work from what I know?"*
+If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research what's out there in this space, or should I work from what I know?"*
 
 ---
 
@@ -166,7 +205,7 @@ If the README or brainstorm gives you enough context, pre-fill and confirm: *"Fr
 
 If the user wants competitive research:
 
-**Step 1: Identify competitors via WebSearch**
+**Step 1: Identify what's out there via WebSearch**
 
 Use WebSearch to find 5-10 products in their space. Search for:
 - "[product category] website design"
@@ -175,17 +214,17 @@ Use WebSearch to find 5-10 products in their space. Search for:
 
 **Step 2: Visual research via browse (if available)**
 
-If the browse binary is available (`$B` is set), visit the top 3-5 competitor sites and capture visual evidence:
+If the browse binary is available (`$B` is set), visit the top 3-5 sites in the space and capture visual evidence:
 
 ```bash
-$B goto "https://competitor-site.com"
-$B screenshot "/tmp/design-research-competitor-name.png"
+$B goto "https://example-site.com"
+$B screenshot "/tmp/design-research-site-name.png"
 $B snapshot
 ```
 
-For each competitor, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
+For each site, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
 
-If a competitor site blocks the headless browser or requires login, skip it and note why.
+If a site blocks the headless browser or requires login, skip it and note why.
 
 If browse is not available, rely on WebSearch results and your built-in design knowledge — this is fine.
 
@@ -194,7 +233,7 @@ If browse is not available, rely on WebSearch results and your built-in design k
 The goal of research is NOT to copy. It is to get in the ballpark — to understand the visual language users in this category already expect. This gives you the baseline. The interesting design work starts after you have the baseline: deciding where to follow conventions (so the product feels literate) and where to break from them (so the product is memorable).
 
 Summarize conversationally:
-> "I looked at [competitors]. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
+> "I looked at what's out there. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
 
 **Graceful degradation:**
 - Browse available → screenshots + snapshots + WebSearch (richest research)
diff --git a/design-consultation/SKILL.md.tmpl b/design-consultation/SKILL.md.tmpl
index 0ffb121c..141a9190 100644
--- a/design-consultation/SKILL.md.tmpl
+++ b/design-consultation/SKILL.md.tmpl
@@ -2,7 +2,7 @@
 name: design-consultation
 version: 1.0.0
 description: |
-  Design consultation: understands your product, researches competitors, proposes a
+  Design consultation: understands your product, researches the landscape, proposes a
   complete design system (aesthetic, typography, color, layout, spacing, motion), and
   generates font+color preview pages. Creates DESIGN.md as your project's design source
   of truth. For existing sites, use /plan-design-review to infer the system instead.
@@ -76,7 +76,7 @@ Ask the user a single question that covers everything you need to know. Pre-fill
 3. "Want me to research what top products in your space are doing for design, or should I work from my design knowledge?"
 4. **Explicitly say:** "At any point you can just drop into chat and we'll talk through anything — this isn't a rigid form, it's a conversation."
 
-If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research competitors, or should I work from what I know?"*
+If the README or brainstorm gives you enough context, pre-fill and confirm: *"From what I can see, this is [X] for [Y] in the [Z] space. Sound right? And would you like me to research what's out there in this space, or should I work from what I know?"*
 
 ---
 
@@ -84,7 +84,7 @@ If the README or brainstorm gives you enough context, pre-fill and confirm: *"Fr
 
 If the user wants competitive research:
 
-**Step 1: Identify competitors via WebSearch**
+**Step 1: Identify what's out there via WebSearch**
 
 Use WebSearch to find 5-10 products in their space. Search for:
 - "[product category] website design"
@@ -93,17 +93,17 @@ Use WebSearch to find 5-10 products in their space. Search for:
 
 **Step 2: Visual research via browse (if available)**
 
-If the browse binary is available (`$B` is set), visit the top 3-5 competitor sites and capture visual evidence:
+If the browse binary is available (`$B` is set), visit the top 3-5 sites in the space and capture visual evidence:
 
 ```bash
-$B goto "https://competitor-site.com"
-$B screenshot "/tmp/design-research-competitor-name.png"
+$B goto "https://example-site.com"
+$B screenshot "/tmp/design-research-site-name.png"
 $B snapshot
 ```
 
-For each competitor, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
+For each site, analyze: fonts actually used, color palette, layout approach, spacing density, aesthetic direction. The screenshot gives you the feel; the snapshot gives you structural data.
 
-If a competitor site blocks the headless browser or requires login, skip it and note why.
+If a site blocks the headless browser or requires login, skip it and note why.
 
 If browse is not available, rely on WebSearch results and your built-in design knowledge — this is fine.
 
@@ -112,7 +112,7 @@ If browse is not available, rely on WebSearch results and your built-in design k
 The goal of research is NOT to copy. It is to get in the ballpark — to understand the visual language users in this category already expect. This gives you the baseline. The interesting design work starts after you have the baseline: deciding where to follow conventions (so the product feels literate) and where to break from them (so the product is memorable).
 
 Summarize conversationally:
-> "I looked at [competitors]. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
+> "I looked at what's out there. Here's the landscape: they converge on [patterns]. Most of them feel [observation — e.g., interchangeable, polished but generic, etc.]. The opportunity to stand out is [gap]. Here's where I'd play it safe and where I'd take a risk..."
 
 **Graceful degradation:**
 - Browse available → screenshots + snapshots + WebSearch (richest research)
diff --git a/docs/images/github-2013.png b/docs/images/github-2013.png
new file mode 100644
index 0000000000000000000000000000000000000000..186324ba71bbb234778c2e9c185bef82f66d663b
GIT binary patch
literal 63425
zcmeFZbyytBwg-wPNP-3?!6CQ}5L|<W;5rO85M+?xHaLU?3j_%65D4yWgCw}SYjAh>
zH#z5?d(YW#@BO{^|Cz6wuI?`BT5DC+TEAM0&nikXPq9d_kdTm`%D$CSLqbA_At51u
z#dw5xf|bbciiGq;$wE?6MOIRhO2xs})WQmig!J}v4EV8@dN*;Zu9_?cUeJf=p(H9A
zx)0HKI!Ig6crjnmFz7n`z8T2?i1gq=@1()v&ma(FZL8dZV%FgKDpq2RXy>wb-~~UV
z`dyYqp+&xn`-`+!56O=Eb6iLqf@oaY?D^=gQ@IT&NC|$Veobzn7eUAPhD>~jrjL>?
z(GeOJhBWkO(5HrP@*7`eZy0lt&-nv*l=w4|1kzXYpiyZoLy9&r<PUt<&|^=eAg(T5
zg~7PIL!BV!HICOo1t5O)&?FE)Bougl)7E)R<&A-qK#$k;3VCSPR~Y^}9@F_bhwd*{
zBH2v58_C_II6e^Ck!O%~I&N}Q`p8D6&-bV+zW!5cMPDjMi~`3kK8J5o)V)M~w_?3V
z&1^uh0Ds_9t4dZk^Fn4bt(rgq^;S^)qaz^;cavvrf=J(LrN$0QS_)aA<{xJ$tB9Cg
zOHB_&QJs=$_`<|~bOxjOF5!`iCsX%_etCY#)bkas!1LYRkb|tK7=@8nP(gd}w_4=1
zmE*j!Pbd1lUr%aLZwY-H#2&@m1E5MM;G*y?lh0SE*YWCxnw|u08bPSow4WpJEG5YD
zx;|r59?G)yElcBEcg2+D>#<VDhGbDAzxOI+m82jO`qeC?%o#5P6P9lYC;Jh1T(K-U
zUe!W@g?@L`s#i);7M;YA`%+UO=y{(sEzT3Qjj*Wp5kG#O@SWacRHJcYdk<}!(+^@4
zR0B^{kJj-zS+JHLbrP?(w&zWBhCr`|kGA=bf~~~0Dg`M##e$H8@i3-dW9kaVW0m`6
z7Qxd=_47PF`XY6S)8nCbBAePtsriIIqgZ)OeMv~esq!Qgd-H(k6H1p4MMpk=H(rjY
z;Kwh%qA_wfu4wiY7?0}?b*4*b$%Cozh5f#)QsQI2BWxjaFjPN#@bLb6*JDRb$oYfu
zv6;!MM<Soa+g=+na>knnk}fyZ@=+j%-<Q_?BAavM2rs$!lktPKc(s5e9xtswla27y
zie3?aJcdh=t9)H^_OmEGo0Q_i&1>h}FBNu@zk=W`Znd?P$<t5E8+>a)AVb{Id)-Hi
zbLq%p!LQJ>zI?k>w+aj&tDJNqRZ|_mp1saBR;0}5v&}WTylt?}2Y%c*TuPlH*rkF!
z67o%HO)Pu#qa(~PREq^B<sYay*LqLH$FFPUBP^g|cA0qPZU&0c;GYz95%5vFSPL;*
zEueU_pfRmbNBfE;t>53^31<?JNHEk0&JV9e{dRqyYhYVqbluE?QE<jmbBK%N8FqGd
zc6S?tE%fL|IK^R%-6e}zuWuUhQ=|b3V&*mU_c&m3jKlt)AC%LOIgp8e5U;PG%=z*i
zJ{G5XBIWD)^$C6JX2mbTxKCT}c(ss%#hJ7)Cw#F=(XAejzXS3kk-UDzkL-=S@l)E4
zXzpV{4xuor$giiDK~xx+=`R)9kT|6a@gBFKFHtqU#Ut=-qv?K268ZTpJ{=dSc2G1;
zK?IfwsoJO8AhI_~R2yGmtMm@ITN3&-lqyfM((7|M--m|15nu#7m01~<HK!MR$|eO!
z?;Uoi#G3y!@ttAlWD``0>J@Nqgf#j?EB?iLkUa+lv47UP7x83CAu;cuT11+GJU?$d
zU+ny-FT3E!H(R!v!!Q1&B8&`J9zCqP<Z3`E>DW0^zl7dWEPV2z9>RQs_V^>fS2_N5
z7p(%rGr}GWA<RIGoTZ8}SyxF~0&OYMjK`kDQJ<&VwA-L<ifvwPD{Zi4R3qSLDK093
zubyvJX_1-IG!$lD&qxZssh8TOZG36@Rk53W^_>Hjwj4W6T!c$hcqA}_GD=LXl2P*+
zQ0|$uRD!Iw__Vl1hTb<PHBq&yJYEgT_rg3$^&fPUioU02FJw233=MHi9*zYKe>Lx$
zWSpETvDaKl?eIv%=}+zWo;4C(xmF3OT&YZ|1Um`NC+;gNr*DkLjaqIpY`JV5a3>@x
zC3-4GtPA(c^}F}WCl0=N7C`i=H@=V2B$^Y4i=Cssicx1mN0`lbLa#`!s8wgO%DpOK
z#<=o(<w<3n#leJV&Ye_Xrg0Hr=F1W7%nHax<^U>vN9DWYc!_n1b)0nz(;Rly$v1H&
zNkzK(aBz)cjf}F)APA^x8=#-HfZvEi+)-|Nq+M4?RESz=S%~}ci;SI2kPIuiD&O)*
zP|fwrv%9nQYr5;3(~@l;j(4PJFIJxya+!0~8V8Zikaj#*;+wN_ohkLm+<$uz(Go%T
z68FpPJO)oWUocN1v~oUoJa=-cjlWIHwBhGvrhN@&Z`&g6tVvO~Y81PAc3w$dn^Vyi
z=V*?V2ya|UFS}Wq(M9}=1ph>){_2FP1TXFyPGt@t*P@ws=g0Ry%eqRnEQgJTjV;~_
zEI3p{i`EV_pRt62V#nPJUTNAESr<kX0(AMb#L9+imS&&LjLpndXU$$uD^(PgHyX)Q
zu1u{>S(n4j!)M^rX4Bvq1H0GcbL6x*Nn|rJ_;1|8BE#}YoaZCfyPR3=3Y{A^+8l!I
zm>u5Rxr@#?IQ49Tz7Kx6U*26$-f3vPns}bVX=ohW!5!+hWpqH}l;>2(6)Vc?y4z3|
zYHUy|SQ`xCgD=<_*N3|3?oKS9PtUhP_VqUw)(p2I*2{)h1ZCm~`?Wg+c4QBq942o}
z?_MqR&a*7;e3&#?2wM<XfH$Unsd&LaQDZ!ZO6f@HJII@cV^D3Ic%Zq6Blb$n*C1xm
z%Lm&h;z8-5Q%}f-*9G^&?Stb7;a@60bW;JgI0vp&#Lo$|2&RZL38V2e@SXUkg!y09
z^42o6v6*Og9jQo|yKd$W?RXkDeKlx3z&yc7B7`v~6H@^6@x8@bL?tMOxhcpgdA<8D
zXCpKtM!EtR@!G?62%Q;b=-qWr2RYl~H{*NaWy*|=%sNv)8+Ryvo+ZDa7p3x+zAZwV
zMT1Jn)4b&5DWgBKR(m(Hof(GtouMzmPIQ_>J8~{wLQYm;I$=bJ(|o!9b4s2~UVGjo
z{j@?N=hmD_Yj<5#xPqYqzJfsfo44|Evnl7Ycyzf0r`ac?eAyQmZY^gmW;8y-I;wF~
zG7UPn{H+Ye&K*$-X?;8i5N&U5sP;TTYNo_7jS#no{P}EhZZbr`t4_A==D5qv!YwdM
zaD;3tFOOc`Ou;%%peq<kKH897lr-@YH|{`#Dp)qS!xM7(eKEfh<ek$1{-vv;eQ4vp
zeER8CrP*7v%7MzXI;ZuOmR~KDrb`um6*{I#{rVg?3uODr){YT%TaLQx+I_m*C63-*
zx7+Ar=mOZ@EDr2CkW+WVk(O-fj*xYr`yr&urK&x#{djpNq!D1N{Sg?!YN0C#+X~1s
zkdvZojuniHjq%o@*E`?2Fm3`qG}*d!99I+Vv+$PC7DpF1RQK3|&ff2h`xj6azG%+&
zX7jM_o|)XqE))W<>r_KUoEsgyWZb0ORvz^}W#RM8@5-;$d7)Bg`+c}0i*(V3z`DM2
z+Q)I8c!e!XSJW!Ts<DjCMAs|E88i)BKL5BE4x`=YKSA9HOiT$7l6Uc5pqn38CD--J
z@A#f=S~I*)RApXNUTvwoof_hSdciv(FkwC0IRmbz+y(FZTpQ1XPvZDdnhSIZXkA2&
zE0f}K;>L`<JbSg{K~hd4ND@UliyKI8V{vRFcv>+!2v6)!WC`CS*S3##cN!jUGWPFu
z5AO|gN$V0m`UaKjEs7#k(ib3d%-?gm+^T3sdvG{@a?w{-A!?R1=$0aM%d#;UaI(L#
zqdTvId$)c*o6dVteT_{4AOX7TTfL{8^gfMT%p#0K1wJ_V`>frLcNOeS5){wZrn)z-
z1Z;LhCDrj6-0C0Rbn2ei657Pg4cDu~CO2)yDPcalJ9Y>B4!}eGox9qb8VU?bVUJwb
z%RI;7m)GCRJF~+rQ)`7S_ObTsFP)Z02h7UNDB&RwWA~0Lj<XwLcWVz|%R#@?0l+c9
z3mDhP<yy5<wX+kuu(<%YJznti)IA>f1v&E=xOqhxDJp!=e@D2beq{z9R5WO5p4;!;
z*@?nj{djMH{3N%U_XSeJ96FN73ncnEJ~f8?i@>{p+>6RPj9Z4n1<7;LTgSXl52u{-
zhX?C|NH;D>@1CB$$U~AEMGm?^+ng$sw6+6IHXmrbz~6sbt#qB78i#Wqns<@8*d}uO
zL?gfW-Q|@5O5!JNP2jo@!oWZ?mX%a_@)QZ#26g2CaUTrTk~LLSL}EsyF_6%ZNs!PH
zDP+VcicI>y={LxXNT~mKj)H^~Xn}<GKY5f8*WbUdi1T-ue_l}|1CSmg?g$X4>o=5t
z<wl2nL;Y78`FBnvadk;qS;SS{*Z~T)aWuDeLhYkP*gr^^c5k&Ek&uY#exJy)YP5%l
z`X?<kw4AgQ6$FiKt=SDtY>lAouGV(H>p>EB6+|Shp-zTWuGUsIj)JZtH2=sUh)Dl_
z45Xp@M;0eb5gIK;6)H(v2PhRUI|n-ljVKls6_v1qiK(EP)SLe)j<^${F?VvZ69fWX
zTwK^)Ua{Lcm;pHj1O$K_TtF@^Hbf3KM>iWMLsvE%$Cv-C<X`njK^=`9EbN>tY;CB1
z*K25G>+B>#L-V_#|NZ^*JE5)?|JRa@<NtIE(LvzvH$YBy4&eXRjVLPo`>CLcg)7ub
zTgt*3K{G@fqTC!D!vDzs|9bO(E&f|ct^X^@`AUHQ-;4g+t3MV6IYJ#IZLJY)I*I-t
zzy7E2zrXySg2KSxUH>;y{FBcAc#0sjD3&nrf0-tV_2jDdHG+?17E;O@h$}+M{_*QV
z{AEO(zpse%Lp<H}<S!(o*GRHb;u@~VyD8|&AZgML12r_lOi4U(OmQ_dG<<vwG-L}Y
zDH3tPEO>;?*1nAtUZy(97P|%BlK07gw_|(~+~s0mzR@LZsb<bGdm#CtFK?q^Bjq_S
zJ_a({YoxzEsNP|;eJCa6@bVA%h=lRsuZ|D2NQMB^zpV=83zFYF(hdhV;ICUlLZjL>
zdh(a8AX<O@0Uz->@5lqz|L${;{2*VD@sR%dz~Df^gP|6-4(a_}t`DUloJc5Ce|;do
zL29x2;QTxh`|on$!8jlNEscL*yq<bmiX-VL{x_UJYGLpAEAs#2Iofk%3^?+Hp*j0s
z^9c#jQv372Aq<i)(n};mz8`{5`qBTId`O6vo}>N^VW{xlAz1lHD=@w8?{Xo8#`y2L
zjP_rl`782J{a0xIYE1nW8VFEm_k2(2bi1I$RU2zs^5x-bHz5g+DcRmMJUkzir;zrH
z$%<&Y$^-YV&Kj-<JR6UT76dV~u;sJqH97bPgg=+Q*q_h2KHFC5cw#G4MStBOl6pO`
zL5gkcA5JNjZ8m6ix*T%UqSYcW+Zq@yMXt;w{t<29a}e^MjvC*$^muE2^C1A>aFFWv
z#*X9m4LZh$z$=rwyiwDki0?9u`7f1{Ysc~=g>txD_UF>GdNqdzAn>gV#iXr{(4=Ta
zRf(Ppas8eoKHL}}m{(#sV)W5>i?(ATmOR7n*%J$tbIl<HZQ;O48SI}mE{n(xZr5X<
zPYs)J3q4h>(~WbAxuw5|;arK`e#ll#V2t~8C8q4PF?hFb?6h)_WIlUNUTNIPUbkg6
zUEXt~c3WW-y>hpk&bx7aM#`;#aZ;dJlHMCv(sk?E0Jy5<;ISE_>H`wp-(47xh#3+<
zYF))ARIdvnqZyQKYGxlc(q=2YTWu?CACPC@wv;KtZoyn;-r#Bh%UIS^?Xry17HnWG
zTR7UEO})OGGE_a7@Fd;`@o~$s<9ddAr~TLC1)zwv9&dG79dCEt?mWW4z2MTW6YJ1K
zr`0Y_xT_Z(xR{LF=Jc)mUKRLk)4a@cc~y3%!YplWl1!j{barbr(4%={K=(D9t{7nA
zVt>X|`;82dVO&uaxI~-ff)kV<&5mxm@OS}$!%91lCZx{(_{0anY=avS<8`a|7mf_!
zNu=E0fL@SmmKrzM?wm9cGsrP%0JAmlX*L2>xrpC5XjUFpR@5E(*^Hxo<$kvNCWhJ5
zxM&BvGc4`fjPv&BwByE^IUGtM|6K;>d)w#5(vVK9KbxgrpVIx7lYSqoEZgRSE$48j
z{nJ-o7uF!{Vu`i)vF)jRL|ZNFx;Wrsop}P?OGhgh?pNNuB&T0L#ILPa=nJ-;wnj$g
zrbn5Uc1m>ZhYbza3kAliy=3YN8r_|;<cN9$J!&Y0J>Np=&%fP0#u>U;1m$3@^=dmy
zBk1A3Yt$~^1B+n?MLxpaHLFr(E6trOk^#D(ZgN(cFZemE^`%FCJfBowyfV&_2_upB
zy1}jFZKp9`XsGiS`r=V(F-keX+4rK}dF$<XzGn4tKKlM_Nv~$+&BZ}4WA(^g{TTQe
zgAJKsBRp0qMX;!Rq;N~!<WAGCn!{}0^Zj^sBQat5rqa}WlNST1@VF=@ZSd8!e+*|c
zKfkwL13!MTti~^1Hi&RqB%NY@#^Il?xp<+NQUZpPNllm8Mnp4Jmf@`Bb_=XMsUk^y
z?H0WgVtLy&i@jXZe&#}kyNm_5;h{+*<!dZ!g1T!;WMTpO?pt&$DMd%jpgbE)aYd4c
zw_-dt=2<d<=muEuR9E!K(j5!2uj?KtR(m?PCmWizt${c+u-=T8(H!MGML13@5l`pN
z#4l!p{+ToL)__olm_c;OM`tx*F0g_j@!F|)5wlbU<v4b>BJH|pqxN9B$t$tyb(_WX
zDCdD+wI<z>I{RdEnDCeaZ?mg#Q_JQ3c|l$Fx3xIls)u*D&aC!24_v;Z_<uU@WdMCY
z5W$>#^<`9f3+MB&TSL|dv#q8VqNJxwY|fLZz4fL)+RRQY?zItv9wM`P^X#M69nR)m
zUX282g=nZ%Uiz2rSe22o35sIvnKa*j@>AaDESF}}<<5F!)FRmVW7(#RfR3$T*53Gy
z%CK^<*7P}cb2Va?`nqF91c!|~FibMD?#Ht0E;#fqZ$^qg$bA@m;pO4NaGo^VBx$By
z!eV&Q;vb?>YNwiz%Am}iC}Nzi2fI~v!9TKJ3f}}DMPmMi_K2c3RW)sO>Rg9a>GL2y
z{V9aFFWu?@dX~@U7MVrDBPm5i?54G=x>O<=m}in#?l8`&xVE%tIa#c}fGbv>;RMFf
zG<i;JvrsS1N<b;%{)HV<FV!8z5O)(L;7HHut41GOr2R-xvy=6Ht{S4W3sbt>TvhI_
z^9-mN9R<@hXYwt)UDc8*eyBcj5rpm5>X`ztgx%&+8$B#G2IebW9=zplJ4jEfb3fgE
z&Q?fhDaJX^b3a*EoM|*Gxm8FZ4DmT<TI)M%>Wib1#$vu&+i;k+7aC0UuXNc-o83I!
zdZn>Ds=S(W^niI}J#(6HdO7@ZYk#@ID6QxCHjO1@{(Ht=K|31wwl_mJaV&4knDZyd
z_x6hM&6nqz+EqUYE%z44jpiZw8nQKM6%}2b!UCS^#ZTxI;=k4w?RtN@@tE`b%oXZ?
z%atYH4ZSZ>+M`_M+R!fLkoq;4_8{4lNLLXfWAID)Ar5Fj$I3a_?XIn&aI>DIk<n%r
z&DlEZu4$QY;rxA*562%H5b4zyy8>@(I=U}IXS(qC`4L?rg>knl;(JCK?$FOqkGGby
zdZX`)YBp28yvSU9*Lhz}^2_umVzwynFXlDK(U;VzfHf-UG}y5>#_@y{SdHb$yCe!j
z6BQgQ-S<XqkwQsCl(Opx0|iulB3kdb9j1WgPaZBnTMi>R?7A1Y6hq4OYVo4Ru`-4(
zk><)~!|XVy*Js(~2v7yu`9LA&t#Dw9DNwD&Em~`vV@zE5>Cd!fDM=J$rrlydn!*E>
zXv+F8Sy$)Dv~<kYICg{VMem!GR1pt)f6)2#7ISG(B9BLx!i9xePDUu{L~YMHr_Ild
z_OU`Y%Nn;S3ERUT_Y+b^?j56M18R2xp{y(tB8qH$mLowVyty)*#vK}}$8laO<?U>N
z<I5Gt)q6r(Hf$!D=LXH9B3WH|8PP#m6XZVFUK(HN?*uj9?93W2h5FYb7FjLnsW_W7
zed>u&0f&vKBLh$U<N#c9tF>YO`MfBGt|nEKf|#ubY;<gd&=||8&DGlPMFu<}7ysn_
zf_Y_%vRr7fM#TNRtZg=?7a(7z4!GZC9@mV{ZMM04ln=`BRj^+hJiGt&cueQ=9mqzs
zlDSZt`035rzF{4T3MMvyEj_zmw|m?d^*YE~OwPDNNu?Xsya+0JBUWR(a;o-0dg>na
z5oVcZ1H{|Q|3>n{zA&dw$Fx_&#cLyk7e136tXly~dDd|iU(BelQtN@4p?i+=LilyV
z>7@k7@N+p?nc+M$b!kr7$f>`~a+YLvp@7LV?7|zEZN(htA*X7kIsSE-p;y7vbWFIF
ztkuoKBcsnNqvP0^O6veBY0;<lz@IA~J+v2I7Z2NqsDEa3;XTDbOD^q2QOYZ6E;CKO
zFv;2|ewZkFPz<s?gF3kS8G;Tdb*t5?wy6ml1%e}(!*doDlODcp^Sqyi8vcB%_$!k@
zi#t`sl7vn%Qc4;>q}~d&%Y2}1SXU5e+is!?Y0p%3A3~qBGAgHs-u1<Pw_k26BQ&T>
zCJ=C|gYLj8<+Yl(3FYkJQM9ss-O&s#O4JkQUwf}%BU$o08reqv4rA$Fx>wWnLiQ>E
z*ooKI$@1K_ryQi6cSU-6C}+D1{!vAE_=a)lg2a&}`i-WYLXi4O&AXk+!mqulevoQb
zc5qWU4-B;Aw6$AjC#;JGj28-7ZV%}!;M%0gTQKXpUyCzv*nR~joZ+z=^NTIf%F3s$
z=J47ZpQKgyV&xQDe;$jcX~@@LjU!Jg(fb_^(XO+?Z#+?YqrJM+DieLxh*uW-GK^B-
zb(wJ|Om{vIU96hF1XA^7B*#a7eXW~VJ@c&%n4Q~jlD#5{NOaNpU^<EZR#1E0e7^j}
zc!BP$qK(v_4?GqW34V;+Qulrx-I>#ap5_^6QrCHyA)Oh^5tOMQ4E6EDaXk+E;cD~4
z?zVQdr$6}Y5H{|8SW=2rg$c$g4||MDG2?e>1@<{;x+}VNqwE3azmEY-cvkPtx=i`m
zF`no(ICb+{wK1}!>;TyD3y&M9=%dT!OH?bW6)$fqkCVlGerjgxNwX+_qVy>r8Eg5H
zP*LQh4<jP0dD&*3Was=2?sAaYH*nLkG*RSJSWi~N^ZrzeMUgY<l}i(AE7ZT#JgNCz
zIwTdLvD-xwdB5PAlLOdb7rJ)(?~AzWUWJi~n8tbDwqdgD<z%z%j*RupIPVk*t7j{L
zhmXNpPjoFBD1}XJ7Ms{c{S3^K@bvaZZq7-~!QMYx+F@H)SkJ1D_|=~H^OP!LY-y&l
zPCInl=QHECRK|2b{o70A%I_FDUcCZ&x+&zj7b(~f3!g!xW_L}a^rcI*>Skt2jM|$k
zjaxc{XUt3qbnt)<g}0u4Zdff<K`|~Jg#xMNf>}pbYlllOtJm3PwVXBb)#lF+mn3r<
zg8m2w_`ZJmV=(Ckhpc?Q&T+DMi_iAn81BATujnam4LBGia<M)!BSo>+Ww;l$7V=qA
z`^F>0I3w>{31Ag1<M{3ue;8C=-$h7asC7h;2GiYp_p^OADy(#@swZS{2UG=XZV}6i
z36vHj_7o`P$a{Wx&>iJ78>7xbF62^i49YuC365>9|J7r}67n(3cLy|UPv`E&vKz~M
z63TC}Xg~Kw?}8Rb5DOlaqvWXlxU=AVy(ejrUD*U1KIf8eeG7N(=7OK+5fOWwdAc`m
z(lCWT2Hy=Vi(bU!e?oUBa$16QmEtqc?8l+Mr69d^x#}T;bGxvlUbAOd!)p3VJ5KIT
zv{Z!snoZyttTqMQqG6KQ^>*xYuU-50i%Jo_rO{0f7mM-9SKN+6Ux2&p*}4kbkbV9G
z#33&EtE9Els<l(0{BEwQq(~ZWQ;l!TFg;;?+uA{6{w+XubbTuSeyB_Hrc)E<F1Hd(
z4!ynq6!_A5a;}PPgydN}UxUX1^0e7p8UX08C=;{{f2Pup&1eV)G`76#5yWaWTF$d`
zp6Hu)WaSL<k2CI6b_IpUv-UHWU{@D28}`nZt@u=hl8OzNJ0Q&65|H<;-{<1sZhqpc
zT5md>&z~C$8|q7i>_?ulEZB<!M*PE7;U>2JkRywFh?`e?6n`!@+$wLEDY`&qdS-EF
zGVQ<?L0`*B>(ZGs$-V1T*iX%x`*6(#P{E{@n{&k2=;gsoV-Cn0p<Wjq_i7eaE;pBe
zCd&`2x%?av%fEDG|B_WCYsbXU^`-T2ev!Jf5Ny9ZzSiSs24JKUU-z>I)&dsXYN;p;
zbQjktoFhQtlUg0h{h!vM?+=C_k0i)Fo|H<xA|5zx-mdZ~-<zgvD*5UqZq|RjXuZPF
zUwY?!c{TaXu*jvaWOTJ@EO)Yxe*I%vFq5H6$<m#m>t?Q%(7`8TyGh<o&!3gvcO8n|
z#>c01>@K~8B}KC?+AGI>(_ewZ5Y3NoU!tMBnOakhx;n9=bM=#nhO)?lQrjyI(O?$e
zwtp?g6r^I?8Wt(n)IJS~`DWZ$UuA2a_6gowfDKR8BP>PAJ&!{d7I9_SEk`eh|B@ve
z^M}B+mzXv)F4o1WwX~hZ2S)D`9ojh@#-4|)3@yDZg4OBR#eo5`GGEA6@^ine0Fd(s
zr+ECZ>SvLa%!Z?+?+6)`W*VtMSFP7Oc?UEz>!sB{IVnTFS!EUTmsZu5yH1|$i`fnJ
z5GMW_SgUtFfUe>8-v!sS?59fxLhl+vHLYi6FXz6^3^se-uQW;gVa#KAqp-qwEoa9G
z`evMVp}M86S<f5*Y!ImBRAFOG^?pr%1WKmm!O!xia}>6%l1F{j`dZ`$wNBH;xy^p_
z{u%wOktd@3k6f%B`v3|%yK=s6hrKA^pM=2sk6t&$jn$|=<o2Lv_5qk^UrOQTM{4q`
z7~zaN*oImF6K(SZ?)EDA4@1{q+TYPll?JU?4;A6r&eblJ)v`O4w`XJ3mlk;5<a6J}
z-OcA$ztNaFt0Y%m{>Hw0%zyZ7z29fwGOj2Y6l8@M9B9rgdgG#Z;F^7?3kfq~@cUFB
zuy4ku)tB~Onf0eyp5<(V@1eam)#gNmC~`jV{cRZ0LEeGquqk-<^jT+Ty{L^gp0i7G
zvZ!On^3N*?Y%8Xs+AScCUd)N+lr!ityw&_v{gq|XE~Vbp2rP!u{tx5+r}(>{kukA$
zLT0`dEMmlz9_N(IC$~f2{8PpYnlYrLrkp1`a;bLfEp<6MWu&H_nzH+r+H%%LsCrfN
zA7uvzd+U50NEHGm)q8fM^h9q#N)j924I90mXsBXUN9g0f6=MAuG56EwF$F6A`-{!M
zULMPtcoLq%0}wg$$-iv6sx9TvT>I~jn3)usDT#06*$tX#PAJ42J{Wa|?N!eOsT#k%
zM2+1-y}8KdGKh=qZ2>d(C-ca#+g@9<Wy!^iK*^ty@=$Z;#VO2IoGAZ>REj+HQg@by
z3S_|f8f6VJ*~BgN<ebPPYh5YI#5c<)%iNxu??C9G6tBYEFUYATeaOWUMcMVb<Q(<1
zYP?a$^9frj3=y_}h8tl5v}*{TmL3?@>u9E&qbK0VPaLy@&{os!3F&**5DM$4(2G}E
zS4zpkvhBff(K}i4F_}M6Z?rAmi!XZDu#@NMjQ4Qm%@3x$)#C46OBiJsee8CUOQY1h
zjE)jhq6O*zGaAHRpKepf0oZjUS|A_vDEPnO#xOy8@>pepKCk3T<`i>T&&A_woJP^W
zuKaG0r-`ZSXW9#5e&Z&U-OXyptKAyWodyVStbo_U>O*W-PQ^L7pl)FloxI%1MxPTL
z=ssJQ*c?uo@to7hoM#5;tzXVfF5sZ>hFzOGyxg?gDotFMuvo@Kmp>moXrqzW!l(0o
z3Xmr3Cb6hdC~<Q^8SVcj^toKS*bVnC5f#IKf<Uid<Nw+qS@MXb5J6ZoCU2F+YToZ2
z3#{$Wdz>1dq-||gn2nVVxSSd;=)rE>_HU&L2&22jsL|A8`wmpj3lkU-^h@3*<+FHX
zpZcDtXXFS0OAXB5Y^~<KI(?Hd$s|)<sBt^mqM1MrzZgyvf{ixa1)7jX(aS1WEGkF?
z+q`_YJq@I*4c8JEO+=(cdj=o*SGw)M1dlFWTvxsozi!aN*S<I&-(i9zj%gg9Yz*>=
zRc%Z0*(_wlij9A7v!%_D?$sR58{J@xFqcWyJ5b*zI~ZmGHe1!CIRe;o<iW)%-OJKU
zkQr{6MUGNhR#w4;D%O#eR`DsoN!6U`gqSS{VNQ+46ihNMU;|aot*8f`K|MZ-p9z}w
ztF84o4|<orGrYY-%Kj7>HWYHSta^UIrOta4M-Re+TQAl-CuI+$0#7^*icpHQn?K_O
zae+(p0fV`+TTw0On_jByg}$Aw+f}4no1dGvj$<sNg|!KKF3)vO+s&l)wk5(TA6RB<
zEf2&6?T?=|rihZSb*1{3L%XGb4S16?yPKHmTi0hvPM1@dFD}GW@ftJjd_7M)NHHbX
z&NhdQmyZZpG!^m<3hF^6e8xS@w8S=xb@K4@-5iJq?ogE_-)28IQ=U`z@-sdqvP2#q
z%tq?#-11Ep5i&ssy)ap774^b+&URM?MSm>M*Du;cAA4Y67`p5?ppTV13rz!-@S*;;
z5N4fSNBQUaWlq$MH~T_{`?D1r1FF-u%)_Cie9(kP2(-GFSg}=af%AK5aOV4Q%N}zX
z{87%50%x1v)W#c=kwlPu`_F_05bul0LTO7ilvMWM0FYhi`xcwPbL-soi^aP6Ma~s^
zm68SOk2}Cm*XnsCP0?<x%)7AtnNReJsm#5XYE$I=t{6|rdDSL%l+eIJbo2r*kC>YD
ziVRA4tKJVQu;1v=uEjm`IN#4nfy0JBqK6c&eB$f)xEWBz!jxM3)}PqPe#~C@roKPD
zD$Dl4m)l`XD}haw#vVEGm82fpE^s%@dG-F=2WP8;xoYh>4qAskqoN!Sp{OcPy9ahT
zJh7&#{n}qFhH*P7!p?%u+jELGG{V47WU~Rze^426<v+CN4TwDMd33%xB_}+Z=`gEx
zbR`5KS_bDwcl%@9#>Uw8rU_ZJ)pk$RH>pq=*a#tqjW(4mCQs#NzD>WaT)JR$ht(xt
z%|96{mVQ|$Y`I{hQ*KnGPC-0IABxF2vi-^&&3<-aFxKC%S&zlGjD~X91=Kt0UKWZO
zWhS>&q&~ZG9ZUcV@z(q57lK)ktn-c<_PQkObem<ceO^=S;_FB2m1`cR5<H)?QtM6%
z62WV*TnvrC+5Swd7SglW0e50c?K0RT??4yLW;WYw5!bauW8!%3yZZ*su`BGjT*Vyy
zXEGR(thoozjIxY#wf0%Aw@-}1hLv`}B@hNfYQ=}Srj_W}!?Vd;`J46Adeb0=rqj%G
z$Til_n|$^AF(!4D8XPwN=VbEPpn~x!CR`Z}W^nL=+=XdwLouXTTyfSZ!dZcwuPwhf
zi8BjpzTphl-lsfh@44trCSH;LgV51E&KAI^uft7i3ZV{U8N=!ZZoW11+a)kPi3kj*
zi2LaMyj(}SC-!<yhqn%I%^xCK_KaDruUzF!GaBkzvC;Q^!rCX6jNCtG=$Af`tz8ec
zr2v%e_7fhF5Am{*R13m37|m&yM3W&Ns<yfBFWC0Bnv0HQ!+lZtG7vYNpnX0K%?Vp_
zenddUA2R=OoQNCJHQ_&P`0~y02jAu{8e<vU9OV%2<$V6}LP$8T)fD6C=`k5TehB19
zTl8*@b5#nw0=Lam5Bv%sDke$Sed@9`=bI14c3ZJfqa_lxHy>RW%SCLj#DcDOU#K%G
zr_L28ngakJKL}*ZOx5N5OWx^(ZhCXdO5B^<<Dk|<!%tfw1nqn0%0(DH4I1?dK_K^H
zJpuFm!Y$_RHCywR;=>IE06Qcjj)3-CQ=^BLZ8HQ^{cefo{RGWw!wKZ<{aBrG(BT0y
zaQP1qFG|vfLlJqx?7m1LPWv$``48AT`UqwB`56g^g6Uw&%cRODieITj_lSwVhQt=d
z9%VJNDy{YUZ4!{BOY!TQE?ta<i)9F1>|?TwF8YsesD{OAR$8UFUo3bTSuPnG(_<B_
zeth<68jH`g?|C$<1wjHB6W-9GS!#e;FgKQ`Hqr}Z_&QOs-=<Et>rgkT@8#cgbuG`t
zPJypkUg2LwkL}Gma=tkxrxg@{5w(B;XLZ$Ywhx)GnWB}Js9v=mDJ8ZIi=<VeWiyzs
zQUu`1`&_+P^L!8?aIAY9;oe!?SRTgPPok!2_@ZAN6Yd~=+eu?nU6`<yiMJnDqyuCN
z(0)QGnw#Uw?qti|wkCrWagR$qQ9<Mw^+-%*B=hsu)KRm=)aK{YUrUnLh33@x`U0yg
zs@2T<Lav$5CRUm+X+U|0RVH1tDZ<97&ko)6a_^d4x3E$~e8eZ(XSZkBR^3jBs8c&b
z357KD5xA3{nYnTBNvXem0ggy!J8um<0}pxyZO?nPVSc|%)Hb{H4PhP;&F4ZNzZj&k
ziD<c6o6@6WO_~f6UFUdj2Xx=cLURykcsSeS)4+gtw(2EILwqpdstcXPqT+y?{!?CI
z@7t-^lGld4GHXk%hA!)@Xe^{Rl^UWvLQcB`>9W}xv(sgj3)#*)KI*ct=3SO(24HUt
zU-K>8`>tLAAW=0=ujG^8Pn8EQ^%&G=p`4^<jVm%SxS1lq?d2%2@uDuAJzC8HU6l1U
zy#wkuWZJgqth*|K@96Zgv@C>&V}b$2<b|$YOZ)S1*jhN5NH)W4SQ@|KxN5Nk6wY1M
zB5FMjo0=@b%27(GUakY$%r)di?t0rU)I<4rU6Yul#tin#Rv4^=@59Liwqax!`?HJh
zH&*iuPpJ2Pn<l1J2kCd)ooM06olPei`WK53Sp}_i_R9C814e{1Xs&uP=Ay8q8Y|=R
zi;e2NeO{K8ByLNKwYBaeygx|&$G9JJ{=Jz8dZ|=w!s*80$mPN}zo2*GxGf_S$MXf2
zm^|A&QAZMZV->x}%+~9AH+A~LS5tc;cD02i-cc}ihH`xddZm@_dOv9S{CRXZB(+Um
zD{m%?T<EA~9JYk@Q_ga_3I1iV+A*9chxmT3NjJM{e@I=r+dw(Wx9&Y@#q#;_V&t0T
z?zT}!&!T;x&0Qh)5>_koOTRZPsen^%>bBXeIvxCC0TYOB^<JgCsMmV3_4#cUFZH#~
zQKxchq+0^Dtqd-6=*3FxP=f}Z=CbAsqMQf!<@USGsZHouE#^)<0g$4QHwf^^9mH#x
zXQlpxq-yhB))AU#gEhFbryR6HOX?+7^l?dRbHOF3D($@w<PHl=xs)q%E1gkU+WTs@
z0wddxi#W64X?-ot9F|{Qt?Q1F@sW~sl3CuQvb$k%mtqICWT38d1)lTzu69mxt4vt+
z@#aUukdOJ0+g@jZ0L$ecBhzQwC%3CDh;_bpJ4&VOL(XFeE1P<8Myd&0ptDeFn>b`@
z?T!t!PD+Y>?*7Z!=F_rT;~O>+gm-0|EK8`g^S*&d>1ID+Oy2SB4kOO7l&1T2qsPT5
z^J=+}VH{!Ie13ynyP@%tKJHuq36G_&n_Mh&0mCc}b0imGl^1xKD%{rVCSCD3n`Gmk
z0`ye5c}}Uy;MU`?L^8EpDC@|?<T`|S>H8GZV89~pjCE@YM+snTP~??q|8UgmF#@qJ
z6ud$w2ze-OxkVpjKwG^t_NDm4b`q5<rb1HHYpl1{LKirbO3dP+?Sf!mbTQ)0fn*U|
zx&p4S7HYHS+*XBsVkTo~EMh=E>8TX%{wwXE-g*LM0ewt(i%|kNMdCuVxvRQ#DEFh7
zAB31B;YEexv)(##pEN<^tOD59^4^}1i$>*HfnU!euXWY(9NVGRuRT75Y2C40m{V$W
z_9!8)-4yJ*^Q+#^5`$$rvy^m#vmJ<23%OPM0m37m<$?fU4}zW=9rgmLc8B+OkBft^
zS=qVmCl@o=5456T?Hte<r|l`GwvyF2gXnLDk`naD*adqPcma9umNH@=6gri6=Eqw_
z-FC(vhOcSUPC!L!s_|EyFtAhyI8SfbrkqVVfl|~{imvIh$KmMfYtOL$8?DmU-iBd5
zF}&8-pS%}O=hFHv%f4?$(fAiJJEtX)B|Nm^=9b25eCa>-&tfn74L91}vwGbn5}o$2
zlxVGaEd`4|aHp^gARH8oD7z9C+yal+pI-TiAts_zfo4&+#2H`iJoRC~$4P{F7d(g?
zHrfNSe2Zbsm2ly*wS2Wq_%)MR2qE+b8@E3kUVUYU=;VWQVv{v?5Ict4F83(E_i<y=
z0A!sZ{BG*kU$hH_w??vvqK0EKoGeDwx`C3OIkic`q1c!|Bbt~YVE|~?A<Uim+(OlT
zBjpP%tD{BCRNxAOQoe}}w+}D0_dK<VLKXbPeYRE&hWXPg_Pn2anJ@yIdudX(61u}%
zCqfZETWv*q|CG&j8y-|GP-$&@=ST|5(`;qeJ+m#CDH1Bqe4F}ZJGg1`lV}}H=VTrv
zs)_w9<}#X*z6ek(Fy&H$)t|_n@kWeSrNG8V(y{%A@o@zKU6Fk+(Rk4bDs&)P)>AXe
zZweYxx=NR7rRqO4=bGzz`3Hw93_X<Fg!?Z7*jcs{1~NE@?`4WV%a$fqZ?X0&JReS5
z?(h<ojm>{s$DVs-ExncPyAs0^keV{fuZYr-_Va}DrUWWh&Fr*uf=w>s9myQcB%9@D
zi6X)Xega~Njfl$HvS`>HnD=#PKa@O^8)^S!EI{o(8q7nw>SxnWIvLUZ-lt{R7(Cv|
z&a}>|#mtbiGjz>B#O4F33cbS#2Z;Jcg_u=&i%95sZTnBPOZGovGZ}lmgvu|w%*P6T
zQh#9BsKBr!lQ92s?7EoC>vlNMJ#zF|pA%F6!QhSd(XQp?yvqVHJI=96YV!2nobwYR
zQUB>0j>j;IU(ctUQ6Iy?f9~V(A4<8UxIg(y7|tZt&9(IK;I>SZ$P!Q*mPg?g*o8Sq
zHt&}UJ2ZK}O!p~;<&ojHH;{IIlQ8B|kEf}$VRzCjlT^(8fM!Iv-{tt-$Lg1=np4oF
zlkee;0BDuhcUkpp)eZJ}Xf$6-X=!R!xS0K(nR>~hy>?o1A7}r#AT}S5<#<&a1nkDY
zzX7w}3`{&H3^@9=Cfm}1%{id{F2Zr7WTkC4E@8LaA7ppN?M70QZWLpif;KEcN%U-%
zjHL!JvFA$g*x4|SfnsN&BAjk$W^e2PygrbsROhg6C%25b;kqo~;(JF9=z5^;Pij^%
zwSNW^D1Z3yla@6vC7<7Ux%A6u`=|{>P^~IIX79NC?PRU2Bb*=1g8KM0ohwUHsgzkH
zgN6zFv-PZV>1}tuJGqZGHzltVM`PSsUC>^<jKRg23%+$l6FIoI-bW9-RlHpO`2_^f
zpSBV`ma~XN!sDK--av5#>IRw*eQ1gWGKlos3ve68oh%ZE9VAtoLoW!r%P6WAsukt)
z)pxEGqk}tve?Tnk@Tcm%_?`mpEd`!XPPN)(aJ<-B5<9X$=+{MQeVou;Ap6F#%Et`$
zE@s0Tm$+&N8eT8L7J^7Wx(oyV`8Q`xIk*l&Vv_~cCZ0EJ+f&(}t+K`Z=IK}_h6>%}
z8Siv0^5o%PF$bLAwAe*96_L~6x!lzGb08U`=5Ivh)DdjLPf4U&u6Y$&*ll-quR<!{
z@7Y#DXW6$Hz}9Kf3j=#evWu-`IcRG7-fL?cQGG{(fkG|^azAV0<G(0eY4bAe1~@C+
zaXFxrl`Jc_qj~VOp?QQEuB?k$?6z&eTG%%XSNcMeYKH4Wld=ZQ8s`}NvGJOJ96H-Q
zb9pI0wssd>-cl^O^df{w@{z|yY%p%V@D-MhW<h}_Yx<WL3pnZq0pO_=-ZikHKoU@4
zRwcnt8AQT&4@PWz*QaQ8$3{;3BaN4ei-bEDYs16dgp(i87CRtzC3@A1bQaY|XsHK!
z$9b=6qVO6Ru$Pir(^|MjK@>_Sw7U-1&PxsM>$?K9qCz$FwWI#?r8Y8v$J1D_cMqa^
zjZd1Dk`*BEi^yKqnR2>fJ2pc_s*4A!mU<qR-!^)11@pj>%L%2fMQ!}sP&VqbA1yw!
z6KodCnM~X^Em8@qa#KX?ly5IhvMgSijv!W{B4#~IxR<*#!dWOycQe1whg?v>xKr`#
zSuX!s?_Msrh8Nl&sV%MD+zT$w2oMX<t3~WtOCk2ITjWLoek{n_LwN;XNcc?Ai0(3j
zQWX&XWLbu-GIH2PBEIPJ68>0n0YEta)sEX4^dHFE&g^Jh>&xBxq{}aC<p}6jUc~*Z
zN{D#;T&KqB4Nv>(=i&v|0^w_0EkDS>An<KR2xq6}#_h2<t|wUqk9Sru(Jt%xnXuNQ
z|MbPfU`G+=)V|B6CbXF>(he2vNt@im2_C%s4F#Rrbex`gSF=j2y2~Nd%9yK|wOr#R
z!BCxE%$gbAhlp~M9>%EeiKROO?;Q^h?P>KeRE{$Iw`O~&2WRD`ikJ#L#qc!~-Bl)P
zgqL&<imi)im5Fon6#`DTa@A+?Vgtj-zNg*=;)mp}1O#GiXhMy|FB9mNmS4Zg!#wb0
z+ufdpd#>f<y?V%uF^c5iZ2p=;$EoX4G0vx~rP-|M+!#N*hCq(700i9D=O|1nJ6>5N
zMf6`s8I;v6w&NJy3AtV}vO&r;gV)Ix8&n|{KMRg8x51y`5lq|1O;Xy1li+WtSrpaT
z4GvdW^Vb`cOI%A(PF)k`INOQ2JzU*;NRwxR-=e1bUDf1j&fM>v-?;gWBSaK+og>0+
z&o|zh<NU!a=kzL|5^H+ABcWpBEq`q~tt^3hiyvl{#$br&vXIw0s|exTXr`<ru<7}r
zBQhY*sGNsDbY#mPu&mbLx)5hpaLNKM4tgPdp!)Ih$X_>Tb?JRzNVY#yaOa%%&ktfR
zWMi1K;^~gFIAXBR6)q@+ze!4XioKk&d&irw;1#D&^r}1&XO6+=!Aq`zqfRN$e<+n1
zDpxXqnmrqM{RhYCTglf7Ez&uDXKX$lgK76CId@@8%ULXA`I5LV=CidCelJ(#b#o06
zzNO_O63}%vcMPlQSn*VXBOuo+4o@<_O!7u&@EblpteN#56U6>dH4mfN4)%pmoNi4h
z)px2Bi4g>7hUz*+XE=SDSya8pb?DC2M-7OG|M10Oqw9?#$qam+RK%OvdZvC}mQ|z0
zW;>cG7aYg?p73}wrt}7Z7UrKB%O@;+H)e5vrN|8D>hXGGv_#>ka-hW34{l*6W!EQ=
zu<3iwnXHGsOF(l$MGbR|7d9<jtunq4y@s~AS`-Oo8i0lPo+gJ&n=ggL641HNmv4ev
z*mIQ0cvPaxCZmLpu=<H4wb)?FDWdY^^%ooTD*ojLs(HX*gddRd9wBfC;YUchNO*Ic
zKQycb9+n*Cg#^uNmbc|BYn49G=nMiP)>>u4v0XA>(5OlK^-4^Ia!6?Wg)4m1ODcNa
z@8^)49xQFv!i(0L=%YQS*rmt1UvVfz^@Ee^<Gaw?Xw@rSuSm2tYkC^pb|~L7NX>g(
z?5ih^G3A-%OmN{o04NMyz8$*M>t2dL@vGr@LerbF{y|u9J=~kOcf~z?Y9=PCaqT^b
z&7=sUi(gF;Kh@a+2ghBOIR8$5`(+iGC1Bh<mEF+Yh@j4H@qFoLdL?Z8VZKTOKKHw`
zul2Rb2*_~7hxpE3=d@S8B|fx$UJBD-!(45mp`kD&sEGhJ{k6pK1h2WN?-PVEm&16U
zMyJ{#<q}JX^XcZa_?tzdI~Mx%sMrRp_Ia(^Diwp&{pkz9)8{11`sI+2H_=z~c&d>G
zXouLyIARk;;#bG3(Y@PZ$_<`$yT{e^%4zZilMn2Cy*JU+UOI+DF1`bw>mq7>rr#<9
zVADLPy6hFbm<vA8%1+}HwmP>t?z=MHHTQ?BTj}>{AJ+gaHl?Su=cs=cI6-BOQHYN+
zNlWdN_oGE~JGwh-2b~9*SUGIG+D%fvZ?(Z{X<AvKvg+YommWtlgMI@bsGS{$_2U`7
z4W_>L)fG5t2_H6|b5gE$WKhqiu3m#ftyzRm1k)}w{rMFY+mlr|{}<y}O0(<d8JB%Y
z<@U)2GJQe=-D9b#hGw}ZPS0S2SiMl<I?%hauMDayd-a4cZ4T@C^qf=G-nH5%y2trV
zuE1XSSiY>6yyrzsY40ov&F!EK;NDE&@V=~_W7213o$bX2Kl1GGijR7Y=qD)2L+A3%
z-DBLM>J7YN*6~%x<bmDyJXRK0`_Q9A=~dj504-^c<u!T3xX%5cvZ$atg&kkE0=JK%
z=ORVeZ~(i0_5`^{PodR(s%FsjE&3Ja5<LFmv-Ta0K1$nhD|pS_<F4+B;bdB68QXv2
z#s69?FkT`Po8|PyGl;cMhLi@yuvwbsg9{Qz88(x{8KM(;Es^&Kh^yp=puTZz+yxq!
zGu>662w(^oCS|6!wq<uM)<Q!w?1CxWll9C1=l5E&tjUT=0%^P$V$D{v-PVb;bI5j^
zVkX>s^A7+}$?a1w&C@#nJm$i-QH2+a+2=(h1?JazAO<E)UR#YooX>-E+QOQ??bCx|
zEE4|Mf`is=niVfQl(K#NoC~nr92%7cD$KHm39|*Y868udoA1Q2V+%`r7y;P(GaXO_
zh|5$v0MM-OWD}3`?;tZ0TGV8=+-UigVOP_w`JI&=o+w<Tn`W@Nc@*_5krKMVj-7e}
zDEXGvA{eJ#@I$keb-O%w_xU+FKdo0k1p+pqb9dC0^EpbulMR`!tNT?h6PEf_)MgqT
zBT#NlPPKbbET;E1O-NsEYWybcB+yL3UI0hf8#m;<)GkF3ge8}@uV_)!4}9W;P%+DE
zh4g}cvWgb`xJh6zgXL>CW}Jo;E`K^gNIS<l^Eu{UNPDTln0#Exh;iymX|26-bkiqG
zjy$ZsY>I9+L~DXntk8z;R>%F)wfDPIWrfQ3jZ6njz>rR13nAUFg4Zg}ps)>vI>e^*
z9C)6`ub_cBY*q<{PWj8a;=5taVmv(OUNhUCKtA9FgK}vctv!tp^)$q5PAty9{nd%F
zL1j8R%-|j231(SLO#vsdzJ9uO9KvN3P|V9;n#B>$Akqh^{X)zRkrwdR^*3#4{AjFV
zOlOl^3oGU!J3*fn^qYUTqq>XxpBnVPc`2gdArpVu;k98a3Yi8;Rmnj!NpVtX?Q-Jr
z!iqWs#)?(jv&Laad-=*qSca21{HibhvZfCoYS3a!^p!`=fKIw!ik#iJYNyJK;r)d3
z1XR0kYA8DI|1x~)^)uQZqP`n!I!YS@29Z&XWu#$z>N%NnEoL@|4G!s_#4<Kfh&tGP
ztjPb2L;s3bX`n|koU}Ay{EHRipIhe<@`(7U)#J{IKdj&X0R;ZAM8s+}z6tm<Z@>So
z9j^`%Z}i`f`Y)wWBIK#w`OSAeh^7l&Pz*KR;BG}|d0(GetVXu}t(g6KKtp)sOCK$F
zq{k67ye(;XmZp!_OD`D>fTf9gApYOPe8#NH!RSs&gA@>(<7l}(YYOEV%3qH_Bn&BZ
zlm|@7F`4lDEO-mY*+h!R>2@zBqucT%lWAZ4n?yjC|NLWI%F#OcNm@VJ&-y%%eqv~A
zVEwh6<FR216L#c-ZRcV;^7A4a#W9yVPXq!P5q?Iw9^1FjWpXoT(m&vy{~C|~98xHs
zkvypReXazv6cffamTjV+!KUw8K92&J5;#BsxukC;iLCzsL;bt2&=6*6ZEvyZt4zfu
z^>8#*wW&tCwMXp)O$=I7(*K_Ck7?i6^gj?<ZAG?1VwV{l9}(g5n?F%zz+t#;)^Xm)
zy;nxL7=JsPQ2h{f3BUD99m$bZ0=9*&NXuSme@`y;*ju;0K4{K~7M7K`D0=g!F*X01
zVA1e=<-xXUh;@O{z6I<xvdze_n=0s{y+0?9sejsylR@z3`oKRs6J&*Qu`fo;`(80l
zFhMzy0MUn5hCx}GmNMh^<NptZA4I(5I+YDF6}HrGGMQABrbJwKxuN~>6AVIua{n>k
z{U^s>Q|03wW}Rai^5vg0&mjMeaE$$qxOBcS+W4E=K1LuR7NK3xF5zDb?rRl7M2PL!
zd`JrFzf__>@)H>k;|*e}`BVljQ~rY!)W6?~D<Y<M6&D~3=dXE7^&Ars{Mw=4F6#R)
zM*Y9zf6;gl0jJ{gjZ*@D%_84-h!|wP=N?2iX#XYBUoq~#MEd_JNyrkvhQG@=?WFlI
z+9dNM!Z0(CEO-(z|0Q8~#3+*`i{BU?MA9>5BUSq1Ia}4x-2Qz4Hc%n-AZ)EJ5^oe-
zO3@5NAYeCEzGm@T1jvHp17+OeLwRM^pWgX!zk~SaW)&vc{||9*0Torl^@|%IAR;M<
zq)17JbcrA+DbhL862nkKhZ54DAThLbcMlHI(n`ZH3^jCja}Pex``z!}`@a8szq{_c
z{%g%*&Em|Qb9Vi9oW1t|O>u6$^IQ(VSZ1DFpXk>u|HfyglZ>tt8OrD3<3;?y28+LT
z0l+F(&@8H~rk`q8TD|B38qh$mQ|5z0tsbv5imUKw#@E!=lxD%yw|s3U6oxE&Gq{`1
zlM$?H;*O7q+w|MZNl#M3*1Q&uK9=gu^dLA4Ys5FuzMm}yk`>$?mv%Kt{c~sysLqFC
z^=mF)dme32nC{#F=JJ9nEc#wdO!p|f3?u(`%#B!1lY7T5`NV#A0bOOkLn8Xvr_=!P
z0*{nAs|u3y<w!?ldSJ71Lv|^2nE&0ED10?wgb9@~V_APaG_z?S@>FqA$!_m)GylzY
z{ecJk7WX`!{HFTK_tLSOA+^@DJv5ueloD$lm|3rG{rEr~%Wk^yb^R{+=aDPuJ0ZIa
zrH_XW-*qdOa)9|l&!XzzQ3v_DF&(sfb&3IHHmb}h<YOV(u4txgWvVf?^*3BIz=Vu~
z%%{lDu}Z1Jk&<i=9m6NaLaTo=Z?8}Av%Og+ZQ!7l6sDH);2B0ltPA2y9y+Yc`b5o&
z(w%tE6p|lTaL1O3*_@IAGq|;-i4VyRW+vYusIDG#;HAJ1>3vR?*v#C-BqAs!UWEFU
z3=&gR<BAh^5T-OZyCT!3CV__nS&#j3eifD?NM<{LhUp-nALSJ!%wZS0Qp#WeqSs7M
zy;*7Aqp-Kw>+Ff11lqIo%ItZee>zeMNnXJpW=|Hl!EMN-sA{Z#f9>`%oHQhFlXn7O
zIP>Jj_Sojx?&D?<xWgrQ_+?IqEBdXYgS5kg-NincEz5yLwx`3wxbVYZGDswilna^n
z+pIG0JKzY2ozueQFOuoU>(=%e<8zTI@Vpn<)>?(kDi37>@x9H8O&`x;*{{nc8_U}K
zfJ$ayWvaM?4w(WBk1j%O{5=H`3Rb8?%R~v5g|KE1sLgMjxzvN~c%zIb@{xlxk6V|o
zCzt7^Z%x*N`P;)N2DFo2O5DL6w-r47rsDmy%JIM!rY}3ivedgHNdrvg37#K{fiF$N
zrW_lbt*j>Iuz?9{;<cftLpkc5DyZeKfv}<NZ~o?}-x#S2M8V%}u3WA(EhUN^M)GXa
zXsu$U{I}U(F%aC=I!^t|EPr2`idCv#r9!csw;jfA0j+4jU^qTDxf01XM#itpCBx41
z)+$4#^N!b(w6W*o(7q(o6AP#xkt-??!>;wVRZh9s3>Quw%38ba)Y<<Ge9BR1_>Y#<
zHJxDLo6wTE#B26gx>*D45g*R5p!|zH-r;}P^XfO~Llm`SfC3q}h4x0Der?{b&h`cT
z-PzVVt;*3fDS5Sge^0*JJ`CG0))#cOUO2}N%X9A$<U`n{(B&x?lB>8khI}YHJ1^`D
z+_O+~q4*>YWJ8o{n|lRkI@$wMz_9oi5N(<HvmoMDpKk+-UW*96ELp{CwJ@(e^Uam<
zd^KKmLU?*{)aNYQ=nz3F6uIx&P7aRriCzRoqH*qDzRX6PMjMep#(|+?8Kmp_X9%*=
z+%pPMs+Iywly6<p+#BTdX!z+iiQ%^#7^DM6lhH!pxQXM+yz>(&=hI<j3YT1^)aUr^
z*lV>BO^W!T=O=q=#%hsg0u5O0`Wssv1cj*6>H>oUu~R3cOKdFgB%xC^IV-y-ZU~q-
zS_XPs+b%ylEqI|<W&@=J^c&46zq5Gt@8nj5k#l~5=K8L2u1;oWRugczsebU*wD93>
z!#Rk4xwl+6h%sXV$}XAOMh=%sZ=^cQo9aShauu$=?vS?Ss!DPx1>Sw|HHK(~Q~FBc
zs^PiAPG@<g^?{yAQ^Z8ONO$Z(8_*K@{+n<d35$=vkL?>(0nYcnD8r?RpygG8wY(3)
zxxQNK>hO!D`Ak>zC0~hpkjv<T9x(GvX3}%pdbmvT0=oRUF>aj{!K<FF^con*i*Mv5
zj;B#bD*>?L@p{ANBS;AW1(!kAbw_3BLRX$$ik`}YNNRyNE>Jzg*2j~EZ#akE^{}n-
z_KS!3DYmF%papEMPLyNo+eBJZ=1hJ(;ez>LzCJLtRF5xDxRF`sFfY1sKP|I%Yy7qQ
z?m`AI)H#v8w}8-Z7xBq-ldN~!A;Dbnq#d6<pN{VcCT{KSA;r2+Bl%W5tc@Z~K`0Zt
zCiDxKc3wFT#Q(~o&2<u}(r+L#<<o7a8Gs#yb(i9)oaI1DZWO++tZ8Ssb5Esb)bz8<
zvCr;e_czg)eS@EVmubFsF=Jc6z{#6MC0M|_6WZAGIj7Jk%ub8;hf^ZJGJxpD%k|0X
zpksbF=!Ny0rpO`hgw9Vm?=$B4Ujx|xzJ0e{Ws^(-5AKzUthb4u`JUpkHKDjNluNo-
z;6=Zr<vt&=6k}0%_S9$76|-v+BrF#nYRaZNn5EHVv~h!JwSFSB7O3MY?w-I^zJHn%
zagQnb8Eey1mRhNy=ti=aV&b*uZWpwiD>Rh#?I>W&Ar)VCi!PR~NiFFEcc39j+AG<7
z`<dl@){)fZsRSw^yYaysU+qhj@Ai)ukI%y<+K}4p${4k#xs9UOc#1?p2-6-g?%x;3
zq|cS>7$|u;?6Ng20q4`fle*ci<8_N<Q304N?8^sf_=c)xt*;U@l=SKYT~zuJiPeU2
zR8qznhOl==YK<epTVuYTdr%LAGNK<W0d6|ZfSeHQ;%?cSI3LY&^z!U}immG9*+4h9
zr21F)dM?RN8omxq^s?bU0BJD}C}<Y+g!<$ef=c+Ew51QcOC>K1Qs?UiR8vI3+GH1&
zl{!y-E`?o2iws%L__U|bYp$y1Uqd6U71MlfYiPW=YJm3>QVPCsTt!0Chc5Bi$zUBz
z)G3eoF~VG#{qm=f%(O(2kw9ED@wPeWdeCaU6^wK_F8L_^CPrxNjz#Bunr_2gCdJs;
zl^5w%idvX`)1dg1<GHi<M&#UD>)lvG-PJZ@7|C59yGdK$E6PcqR591-h7#f3GxMMJ
z@HsDKEdw|(k^)xe?rbD(QGH(5UsiY56g%p{j#G|FlL^Ke=r!Dy1^Q1)uHs5HMqDmV
zp)gSJXDu2JTBAkJ?Pa22e!MjKVS##?PA(OA$tILp8D<fGIMXacB_%JsI}df|_B;)b
z1))?i>~F?9CO??I-=0^kNNsMq=cIHu5!#L%;y;qQnyPW*0+n~$p}&h*Iy46n(oMSc
z!dK}ww}3?mlOs{Fd8$9+Cs_hed1&;P(HE|Scnah5G2K-w{9qQ9<SIONS+VkX?t5%`
zVK_^c#MZ#{wyoE#1sqGL$z0GYEHn{r&r3Np$x+}c4x%0fcTJ0cMC!a+a4Xq54p|bC
z^|*36{UF^m9-tWqUMfKe?u2A$#@7lhcqHAj(%o6S&~9u)YUCQeA-sPZhp>F41o?b%
zB+&4}Z4H>LY80jubsiT4rV+!Q(uuLL8ovQM?G9U2pzH3vXv6ga6_%JuIvrB$eklu&
zTicX%x}fe9syla7?7g&|rxHHcHd+`W5hQQZczz{8;d0@=e%*iQu}y*C({%j_LKrX3
zhg`MAv$|L{H)N!_?o-qO&%I!DX<NsWE!=mmd-EIu-@LbDJoyXLSO82@NI#Gpmtc}5
zg{n4l_Y0lZs7;#=Bub2tSREhVwJ?tFDqLgUV#lvImB?F5EuR2p9>MHd=Zfwn#x7oj
z-AfLF&t^Q1qe?LVDcaf9R%6W_4DjQYUmY*LhH4+(ETHyjRe9Gnh#{9p9DX7{mJF$1
zV`$vgwx;CXmKa|Zu)(+`h=M;wY}E>10XsK-7Mx6<?Zf!Bu6BCdjh3W%AA{Z}5r#TL
zFK5cR5sl@?d-bw}s|ZaBmy?%Z)TvZAU$4vbdEl;*%SOXN4ciDJX2<qbMu78$PiPv=
z!H+xos}JYSX5SHn*0LDK9~nk~Q6HL-PUJ^XBt5!qm?hlNcgKNGqM(a?I}OBd${Y!E
zF8s=<l)h629<`%nZlO6MXs!yCDYD&!j=$-o%sAgvFcd$|%E3n%$Yt*+KlFp(=1IN>
zrr^Lof6c1+lCmh5BR@9;i|H|MBefB_bNJX&S%pA@=_$5Cb|K$L!I*}c^hKdt*g%_Y
z<3O*XuiH$DWwR_s%=gj{cml%R?`5zf6EL3yG3PBnudlYe<3T?=@!SqpH7!n3+f=`Q
zw27{rJHFY>o45Dy==(g<u|)Mi0?k<X;nI_9{q$^nmVza6Nnn%0$8FY){6U7Iy=zKT
za9Ph7t;F_;lJ0$Arbk7!rGgOek3$o64X+*hw2cc_c(dU2dH$lpp48MZ$j@;6yW2`M
z)8dW@?CO|$uuP5gsflpK?6k>8g_I_mq1=H4rXihUO=$|3dZW&>66vOU)is6PGh<@6
z&KsM(-_G^CHD=4(%pQLwi>--+A5m*}k(q%hwfk1sCa3aF24|Wp?A>q9yfftk#|F;<
z$x-1&n}EBa)m-bVpClt+Fi|nHI=sDNQ%9+aq{a-75wsMCPMW>BWSfp`q;`$l3UgDc
z0Xk0=b`O)Yj|f48`#-drS0%%?%!zLW0i}>1D}^8I^5H>Ps$$u)EhqRCx)a0gnU-4!
ztz^A7arR#2&$kI~Lch%72Nz1IjQKYZ)l~$)BTifU#rXhgtX;eP7P{Mq6+gQnJk44t
z-n?JvRw>*bhZWiA28s>tjBB7a&;{^O=qf)<3jSP8dL;iSLZKCMjK{i0OFndvUUc8k
z+c3S~;oN?itxQua3jYEd?{vUu{9viP74*>Fce`HIl_~vH&G(nXNLn-5(xxaKv9aq$
z1A$8LFa>=iH&F^71H%-S*F-##OA5RhX(QtnV2GIxEhQ}Rt9a-_re=U4*cT>e)A_7v
z`ek5ZHEIj4BRuGz;H8)|kRYNT71wiWdHKgQVsUdQhI^L%5>jz`Qt|H5iRc}^)`@Tp
zNHc_`mA13xd2;i*ehjTRGnbABH7pNM5xJ!KLfhoDyQ5Rmerwu8n_5A4ws{v-h|>6=
z4NBVNg9h;pX(qFVTer=1ySWzqMDi?u{0cBUh^@Fxp4kuyBk-;B-S-)usKDl-!#6IE
z9P2R_aRdrM5eApPE!H+^Ngm#4QeFz<NSm6d_@KJHy3oNwquo+cH~<?)vRqc(ZWhAQ
zkSfFA_>ycMvsf%u31;c1+tWEpE&HxAC;E=$(kKAKc9ve!YM61?H)S~ONr8qISpmCG
zT51#Su2#M<$84&Mo3oQjsvOJ3(OD#v7o@=&NL&u6-c?JSe@gpM@#;-l^qxrQmGfFk
zu4>vO_&JI`EJSC0ZY1=ST8&~hwu~y}Of>@ROD8tPU62+lb_Ydp`^+tzs~H8AWB~4y
z8~5u-EIY{ecVP9(#lAU+jhCQ=KlLb4)H2{;l8Dw=JB9RU19|1uI!OX|ob&v+Ouudo
z2g4mP1?L%l19YLpPQO45I}$|=N5fmDBNYm!?5g)0%GOkHXDbXMrL5$)Q$LVo93zA|
zq`ePvsBYy;{%XP^DCWY24*-O=Uq*}^YwykEooQXXtZ~fE^`*(Hw5Sa;AUq189j;eP
zsogJ~I>uJ!!GTKNRUX&m-VlYZ*v)POCSvp%zD8GQ!huBw6x?o(7=A?R0FLmSzDUK)
z%WuhCGQaZuH!kXu07GqZTp|~5DM<}<fXkOzPWCmuO(CDmwc}i_QR-6WI`tMVspI;)
z=N(!R{=b+N?KLHT&5=RKbA|6w@hWUKHMmuxpDs2Fy-*->W?B!Wtimi=ho-P)(w4ac
z+1$kMZ~gKfbai@KCh67@g;Zv-9Zl=V@U_|bSJ*%jOAhaC2X)?u*zAw*RH%M^Ab^iG
zB_A0#nJkpx4`1_=1^RN8sBbsnS|EsAXu6K=Q1RaRC1OM_GN&x!f5BIqqmcYf{l+~9
zGE{)!1#7*>K_W(9v(`ub$YfP-%}uIsZX{t8m?#;1gO2lf+T=L$Na9hCF=P6scY;J(
znmG36?UA6<+)Fl<kWZ<rZ>)%1HUbS7`7EZe+&5<sGhNFDsM_6~wiQyJl&m+C7X^Ft
z0N*uG)`Jt~>{{I(`}67pbV@zeULGEcqn$OIkqWVzOF6&#bt8PNnd>W%k^wW1fl8*^
zDWAd?9=@_y#jF$x^x&*#R``-^=5s>c>k!RG{%#7^0MySlJ?OV>=Pzo-^IcdPbU`jd
z+1;$h@jWYPyoJs+i(1fzL|G*aejKP>9}nK};91x#M+YC_h1^JNS)t^ZC2tBRsWU#w
z0Um3BVP)p0V%gzw^U+9Owg`0Mnly@DtfNrei?qXBB<(H$FM)=>G-6XYtK!*Hym_i~
z)RyyF7Y~Y>HcR#ZQxnK}AVxcMD)8L97`SssxiIcCl9m#0x=%}!=>dlFYl51UBo6K^
zTn~n;+eXIdyh{5J3MX~=7RE<|m>x$G5Q4T2pCgh7r^ZcPTGz8gk4BJK3-H&;iw}>d
zI*>C`+Mvh6i=7SpHxGLX9*Xu$%qHklO56LOSY_+!elM}wbF9_fHy+a+$Ltg_kDJJF
zFp;d1!>ub8fvqc|46$q7-X>69;s)B|1dPx8{Fj$XOhjTT<2mtoapnj2mRDd&O`{r}
zA1?)RYnM2f(#85si8wei*L(mtDv^M^Z_>>(=MAxB9=q*Z@=ax!&FDy^oxgK+7FZ%Q
ziqyh|i&9>31z{L6YhU3VL|%3a6XI9ej(EOMTF>?arj)~%B0pX{-2r<2&F~^Ix50)x
zS}k0)Ak;AHl}WD*fbZ*UVXoSc?h$-aT==3~kk6%F?WIsW)!Vdh4ry!L@ZnZrsXX>8
z?}A%C54DAc<~vk1e#fEB4cDtlGP_=w(TLsUmP+0(&-V&(@*HQ9;kg4T*=xL772j0&
z`ZlJQR}2?^NymA)tO!8EnLy*%9Ry^~G~kLlPzKeYN8u7nsK_<%7F9gOW3R`94_`%u
zlqPN7@(t~!UKOylHD8gkFAH~C>P%YtGIOSDZVv<|>pf$<wiBnhBfh8Z{k(Le5~Obs
zTJ=p+cniQ7XjM_!iMs}2LFtL)`0t8SV8TR@yj~}3K~&>S3m3lSwHs&C_Q^cKq$w<2
z&PW-KYaYEQ*))e`CQ>I6s8Rbjq`mDVfCLSsG}Dr)y0&n2vX6Qhj`#y&X^#VCR7x3k
z{usmEd~%UEmw>aT76mx)yfK!WC<dlSJNjxhGYdb`L}N=eG*iQ!SyqyBiX4HxIQ@lu
zWzcVq_5&<DxbV>MD_<G-PvM$Z-@joTPjgjl!3ERHtE6<xEnHF9C{e{UU`2bhTu{2(
zT1zp>jgfW(3Nu&;yRmj(Lbp&xcN*`KW*U!^p@&4-v6(0We>FyWQx!_<T$Dn$Ieen(
zOPmp4xcNj9#P&NLVjT-HQW+|K^UJp%04yY3XXL83xpzk7&^s5>nGL8>ZK}y*Z9J-V
zA;bD*V>`A~Sb?cb6Eo}RsyKOX_y{8L@<1N+V%&Q=Z1%h0Hq;<RUk6uh4BO`<H_Y%<
zMi|8Z^#MgZ#uM9xLj7&8dGp%pL%^D}YsD??BDs-n8Ol&}_5iB6<7uc+Q^H()0rfF;
zHV3LM+2f=DA8w!`WGCXi7~Y<^<qzazAEeH-FIvVTfjufZM><nN;wNz)Cw(W!w9g5x
z9l2CYe}hnTdv$M)jDRpX3?UvLJZa&)3mcdkE}vBx$Lzlhi`TPF_`<bbp_A9od-|Q@
zh;&I^>A*B_Z6SR#cQ_umA#LF^b@NHn9MGQQ6*<ezebU1c+rJJJB8_pbBWtPn!pm73
zf5$IBmqahJ>1~8@Kg#@wZ?U^K4Gw)VJ5xUNRlszTbvR=N66$taR<r5CX!CuA+3S^J
zph(y=3LcFdNaYO#=C;AbM{82Sa^a6mF#`#YZ*Kr4R$xe8^?H93FeN+m<ED3>(#l&t
z)k^Z>*9K<!kS$t`%cKe|iN@`*Z>@}WI_CAjny2w>V<s=G3X1{GGZSDm;VY9<&Kq`O
zA(=LBMy^9X?jz$+vZt?f!hU*?Fur=eXQ7(wI^D%OBy@=gu^ujZa<<;lr_ZMftPYDI
zIx<H)<($*`Jda_H%pET`>EdfXPn-Mhx%5|?Wy!8p^|B@Cvzz_rwZB)jRq_nyk9`Kx
zc-0t|$jqp_<ezt5@Z@g!=CQ}a+*7AS%;|t-PcgtEA@;R`Hwfy3l@Y^5V)6sV03)_N
z=+j5zO;O>kzOyX9fF^O0m}E7eXFN|oUd4``M6&Ju@UnwO)+^&g9+$7Zx&01a)YMWA
zZ#yvEvHp?NBFs^Qk;@~Q?3x8SMmama%TgIXMO`#l#NCcRS2V_}7Y`aZr1r$}2UXK5
z;ZGYaop@a;2eL8JYBAnH2)*JgArNy}XD~u|orH!<IqcK7pI*639^qgI4`@@3mSj~~
zp{rV1Xz%7b#c%F|N4kfr73Ja2irnOX(0S`N*t$<PUD5X?N(SyOdiz{087lfeag{A0
zFl;zr<aJ2L_S=d$#4GV?>K${xOp$OZsGDA@*qs6%M7Sl*?HRI1QurKSiYX)?6Re_K
zZvgv;!hjB8yLeh9cA(Htzw=gOlf<bz`NYs;V?-Mx@kR8Ar{_y+&@cAVMw5+GU;z-Y
zOW^SsgexA{cIkZlli1y8PU*C=Yh}pt6>da@ZG-dUBOR|RDk*6%_l-rYNRTij4kai|
z+bnj=X0#+z^uVWz{rUmTsM9Bf<*60R(@kW7^~kAV*?V3An`ylgrzXUio!p=4l@hd~
zQ&!o%9Mv#it8B}@Xjn%$tx8u6Q{|i=R2rpSY=B6Z?n-FJ*cCWEVsZJa=x>5iAHcA+
ztQgf;3KeL~QpMU{NO~Oy^EDlvUs|0+V}E@*1lRH?<6@moJ>*u)2zchPz!QHIKb>6Z
zM)iU^rvj}}k;+MZmiu?5JT=k3idF7M?xdy0P^EXio_w`;Soa1D*lC2)XY#3Rg9MI?
z4)Ja$J+65%gnqF@C3^TcQ&M`&`)RfHkO~4b4;H?2DA0;@Jm2pCaKBaM`S-pdH0>v?
zM9z{4z8AWId9@Ym@-QjTkblLvc_B&7a}6%6;e^?N8Rs?4@3uT#?9-8H?RmAiy~Dh9
z72_E3bt;uKrr0RnOE2HmD#~5q-xr2J)YN-&{37__O&@qkM`NN+yJ5r`A$8U6bi+YZ
zZ%&ci_}zHUz<sADzJkU2vUwiAeFr$jFTB_DBxgWS?>U<UyPeD>z^h;Tz=5$+P;LGI
z`^b)3_N1!|zb$*AaDQokpzSxz!{L)Mr!m^d*E)naH;26O!cd=8LYAvP7UNGS7&b9)
z*DpqK>VvxpMmHrq4I^(Hs&?Cb3}CgmPP%(DnG^0=gc)M{9~tUi<?j(*@hR5aaXx|_
z6-_v86s6YRLkEdS4zPw9N<w%+P*6@yGe|8()LTvfr-_*H#{i?K>37u=d^PP7)V^}X
z11?{Qy!d(3U``K1>>4F=MWa~sZ@ocH*t=l$v02iV2jTGT0jU8_r<0Qw-ZG}AQUhyC
zoIZ=D6cMQ}l3ZvQA&azzesjeguv3hsNR6x|q8F)-yC$MI(hTaXcv(FyRg~#AAEY-D
zi2lhkqqspz4p&pEj_O@3J0NMonAv<3LMtift7q?yQ#-J}DojZzH+dV~7V;EWE=arg
zgqH_57@sI)K#bLDkdX|if$<0=c7|_5Up`gO`5}x;$~yon0X045Opm$SQ@8x?U>znm
ztg1;4UoFI{@v|(<aN99T55OapyP(0%AouWGA1)aBFj|ZTwy**_B@b4yi1EhYa~sf9
z8{%7cffcgAj)%)f9AgHi5npxo&9mMSj>(<)oMZ@pI!+BOwnL$~(}dllRg#bOsV%v~
zxYKq;z=|oQcL<ghLGhQ}PbD5c3HZU;6kr_oV;_>8xzN>W0e$MVGKgW<e)>APjqIwO
zBIOq#m6{x6{RSb7E5NIPp#%j%z&cJzn)B%y7-XLx$H#$=LMZ0<cYC<i3N)U6ugJob
zzAiENuJAOP1we4qph<E`)efR7BQIW~JohinsW;F)Ms;p#lJia5E%=8aI(s4?fiOOj
zO5>t+fD-7<aaHQ@_yBZov~vNQ&sUtEk^X6eptmNmCv(ZPVE@e~f2)Nd+<GLRI}@tS
z7I{*3|N6P|B|ZJ3NP20H=GUZEW`nq|=ezh%cXyY5x0H$j^%$cZFme}8#&PjG=N;-3
zyRneY(StMWKhL9y1g<ma#0x*Izgj7PU5CJu^THv^KA7SYx$qh<KcPSSV(t;U-L_Hv
zrAKt*<GUyH1~)z*XN_*yUGJV_(=M11q`@=3UIA{K{2Bkx{r;c^a>2#%42!>eFSbKJ
zB;>=|dRO*M{XO;_W?vY^zO=X^eJEtiaIicP<n|&KSjjkaBv5eHL_E%L-DgtwxXi0v
zL9gz8h=A_Hw89EYUsa_zy-5s~xLtvC70#`5k*4h@3J^vG*-W_rrQyZLV$pv;LjSP@
zG_{;kKV`%ER~-%4|E~l-l!ytN{QvAC{Qv1p-mhk6GdrEPE@eD+7o<w9BS={Uzki*1
z>A^dVZ`Wh!W*?$5b&|9xUcV+7RT!W>*Qf+(+9l5pPn*)L2<O*5id2NZKgfqV&u%i+
zB3)xY?_w7AbsI9ivbb|;ckyi=#UxoZU%qr+T-2>~H(+Xn@esszX(isx=3Zvg?SQTK
znCr(61(=hr9G}eF)o!spmMOTWvDfox9}@(sQ;2i;*o`!UD@Q_N<{96t2~NZ_uL*XE
zy@_&<*${L$NGw7wKs*0BzHxt;_kDD27w`KDyBMW6wR_;l3CHmvU3>JWgH7Ie)0dbC
z)6S;Gl-k9nhd|C@8o~MU!wnFY-Gx&;u%1x9+@yWKAcsXY^;Z+n`85XeoXD>0VQEAO
z9jZ;aIXtyc+FHF-4emXU=T~!ypDXEV&<!|&UTK6r5F&36rfg+r9=P<BJ3sQSvF2(w
z^f`Wbj(ihJ$->;eU1D7!QT>~LXKZ0!4mcF!-9?xWmanA{$GXprR2F1F@@E)9J?qF^
zZ^zblxg=4enLA&nkAf?>l}EwRuIaRU%t-KV-80?VuC>U&jw5OEOn)&#VoZOTp_pOm
zc9xk$JUiT^F-y|>*}i8ajTb#sosquoo=hDNe*%r<H#9U>Ja3KJoj<|qcz6wy_L`T#
zT33(LeJO?HWr5sXD()+3!sW;9<Z<6;@di>QGTl@`=`CG%g&zp%x<+w&uMD=blkwNM
znp9b5ZNMU;zkd#xT!Lh06rpqQ^#<#aORRDnkdfb?*=%1hDqlFVJ<`ZY)6CW5nTW^u
zlssqQx~quV7SLyf%R+L0KHqB?(CVx9`M)N1Y3a^CBUV2{nvoL#7sl=JB3CRfBZLYb
zN!wA$XPHf4qtTmCGl*~-38zSH^jv$?64{n=TP9A_a^Wyja%e&kytyEUOw8!G?fuBF
zE7}YBC!vII3r8UnI}ZYx?2oZbHM@p<(|(`RS>$W3jhTTg3ctt%{~pb0seb3FP~|&E
zn_KaJucJ=4|EZ3)-IkJnK7PP&Z_DL{rDTMwl)A4p3Vs`mH;h9RLs;-1*X#89uW8EF
z-P<!8y~qW3qQ(?=|JU0*&E@lG#J#j`4E!xnE$bu^pk#cv%V4^jWeFJ33#D|)4+&mx
z2sEYv9dz_c5?{PsZ5QKh1srR<eUKnDVHeYx-PNFM<f>GITsRh-*nCdo&+MK=?SE~h
zSkN==hc_UW)64_@z*VV~{DSZzX|4{lrJr&rY08WfkTRQv+TLR3=3`d%0KV|F4Qusw
za2L+Va}2lw#oSrjWh(h!GkM>@o7*mn;9YUt>HfxMMz@5S@f`?AuEyw&u~3EQ4J0Ay
z%@_*G7#4{bXcC#pt%I9w3;x#WyMh26^T-8Wx;$vox*~9FfhMoB5wJCJF2DwN8%+PY
z8yB3_htIl@3l9NXe9fGPY-+jTCblQ&PKyQ5_>M$e$$tH~mb;bFnz9$mc#PgaV?*rU
zPu!`>$z6~#kxOeQLH4=QkA;^V3$F(NSO`pb?tO#zB>hodqw*iwxcA~%qnOVIfn)AC
ztGp0^rl@OL8#fbdYrA#;j(-%rqr599a_1U%@Kz5?d2Rq)R89p_V3<$>79lCM*yV<z
zRFA1jl7HD+02Z;@mk(WG;axGQfCk*<{djuAWLH|?jeF9c)9oe@4mT(tUTeqh{bAE-
z0HbNIvD+QR`-j_R@Y~RPi3?!IdjN(rk`8ZxjBfxsnIul=SIZCK!J}msb~#7Je<}VZ
zJsz=6`{S@x_TNri4^N2R9e(L?0bB~rv&erxaR_xpi#BNhYTH5PsT3)X`xjpKL4H8D
z9y7n8d#)szcZUrEcsUV-GVR_+z1l9swcbsC^yt0j@cgwPOU3@OOIz3UNa>hHW#A7q
z$;_|eg8kkHfQx`b0L+1axw#b!@CRpu1G@=Bi}dTFkELZb{{3cdZf5hI$mIzfr|g1<
zxXxvsF7yF=&2boI&Uqv(71%Z>m=r<6;?c(&B4~8!PuuRH#B2Jgbn`0pTz+TeC0laQ
z2hiGPc{aD<C7tKetwjy*oE=v_(ue8(xSEt)diBnz;ubar3`1G9->o<XE)DFP;FsnO
z#<f4^-azo*mfwX}Rp~v@81`exc-ijfn!f6PSCdYksK)PuCeh1x2{6W_7<U!sR$p1Z
z<IDMY#NI<E$LPkTB(&>E+Fmq^(+q?)m`u1+BAI5VKv;o_Ca8jTOqe^Z&WxmHeInHF
z^z{>B#q<p|Ft5$e;z&XMc$wV$tsP*h4;~#6Siin$%5$XF{0u>|K`f?vr;SHLG{F{J
zut}w9EzeX+p-OJpWG^%bc!PjB=od>fLo5jRs$oi58%9FGAt2^nkvxObzHGNMO!4$i
z50aNqeCu=h8fD#mZK+#lJ%lqcD9>N%(qzBiKV$!*!x6c=>qw0%!ior`65YCZhjwX1
zIMIY=yv$G9^OIQ*?wrqKE&XA|DVhnLf4dZ`v@upw+TM78PxLf2%dWqfu>1+JD!mqQ
zYl6y?U)5D%d)*XhPs+-)H2+t|H}6K*+WJIaip<42C@qW8en%cTPIvcWDg;zbx@pW`
zSBklhueZp(TV<a65nevTTXuGX#jdas=D@#}q|2gJ4XZb^=6BcMa0i%x0N#$#0B=q$
zI>6O;V2v<=pTib>Uury2^vpgmo~3lh6`}aKjrdxRPHsr2_;#aAM~UT(sKEsuR#@|r
z=TRo#3EqUQPsZ!kLn`G*BUY=QM4M-j#}mw6TJ<bbP@N;?Os3^uRfZ`!cC0^!@AoEH
z3YNCvc-903i4~oVGG#Bj&gnuE8@@faC$2ENczX^VJDV+OZIJqQvh#4z%Kp#Sdd=<2
zJq9XH#>)gwx=<WGqBSeQia3!aL&F5-MY|RqeMJz96rB-^#pwLL1#tBeK<OFq*1$F4
znq<n_kw<2`7Nhj)NnNs&v%2s4z9$Tq;npT7B{+SitgUKY&8w$~c|<-7{9vjFOO}Dt
zz=EL@*_A$@%LV@!@yq8}vj6He6O8+FT!O*NqY^jx!@qnTv(TH4NjcG|{p%Aw$BGR8
z5RQ7%k}DMUuTK>G!S~knO?9%sUFUaL;<6*XECy)bk8QSbN0?lsO}9`%N@R=~{qTLC
z-3ts11f9};|5tYo{GVP5@8@`*w2_dl7vV)e<yX<&Uwgj6px)%2Y&8R(bA}?rGr3hL
zq!<*&96{x~;<>wl-P`o;=ef;xZ<ActaLwshQt@Rhq_DoKJ85E12@ELMUebhEceW>U
z^FrUSMTu1?5|W~m!V-!sCS@iqoa}XH0N37utu+GT=-`~TBj9uAuZHafPztFd`%0Q5
z0Mg1;=$;OZ6S$OkLmwmxK~jA#XChqD7ySJ+`>p$%P4cEf?|-PeY)LyfIP4B}e|Z+x
zI+0gYB>VCuQ>2}ipIkdZN-Y+CFJMJ)#?y(gzua0nk=Y2=ZYQ4VaDMc$B-=1K{?6^K
zgOs&jz>icjbgAlF?x}0)2F|$Xh4sHj)eXC|tBcj$NWD0xmdzk0GYi5B(Ydv=0Dghq
zSw<n^Nrm|1KduO1A}h>jV}knl>=-}DQYY}bh~9Cbn`!I2rg?D?K$Zdi>f&9CL-9)2
zuZm4;_xa-i+^D-44H<FIs6*{R{=o`YE#5KrLV=&*z|%y_`+Q4ym3Ls1k?u3@LE(l2
zKm1#1Y}exq#VDl^&ifQ{ju#O__UH@3th6i7XD(8c^<q{$<n)gsazxB3iNo57!!&0T
z$orCOl|d4u$Rpq2S86UDHmqNRS$<W_mb0!oDA%!jU$sPPjt5<^hLUF=nO71=b*fR@
z1WR&yib71SRSo#?^d(V#el51B->W>NuVbpfuc>+;ITl`1{WpkK2tiv}V;o%Hj}V9D
za^5}4+5+HWve!Tl)3@%PQ=>WEn`(I&>A2#GGG2@p!Ff=N7A+T5C9Czk>@zdbOcGJe
z+URFn6omjV;}GV0*(<#$ZVXtZ82Hh`dzlWq`#<Px*J;r;1gVBQ&MD}mvy&xY*@*9^
z9(#8~I7&H5a6VQW)LJlNQ|7v5<SdrS-T)Q5og$Vp=k?Zkk=srcVL{gs1t)<t?cF!>
zS}`xuzhbGfLOuE(jXv?b{M_8{X^s8a9|!5;70#?2xxU8YhpyM`fr$PFReLdnhOSvQ
zelpR-XeJ<iwT^kbuiD~r)u!r%FX|+zFlXHkMo6dRTE6OmCQr9r(%u99hSuk%4;;ij
zCR(<QPg7w%Dw(RviN9B5Mr@uC-yR((y_}3uy2%X50bG!lJHKaYJ~&pWatZc5)8N$5
zHKE?DU%GvxR;8$)w0$GhmmdazS3jv0yfU=DA8<StQ*$X&PM<|o696#o-zRV^=QI_<
z8J00U%8Egxh@Qf?F0qgLn(!?T9j};nzM(l=s?|&7uYAy*yOvs6M!sd`a1%`Bao4y5
z^pZI~f-*4Q{7Q4Jeh7Zh)}I2mA9)aOx(V4VIxyItX_UUb-Bby2I$UzZsl<bY-E#td
zum?ub3`kV~QS`s)^ASTrR}z4%Lu7vo*Y)z@BQ2+{WKF=Wtch2u6j}d~ti^zS@s@#y
zd2_k>`Xc>pSjT39TKv1+uld4fXXw_HrjuAw<!$*<zcIA$mc&Dm)xqIC;4_nB=pWdv
zTnZaa#~HH^y{75Ee*HR=ty$=>7Y@t6!0{cCdB1)~^-jmu=LHsL*RAOYd2;S%Q^mAb
z-z{hTkLJUHjw7%y&1I*p{USpvwTBXT@g)zy{|N5?3{nyU>ol0bQsd5ECMRX}DWA2r
zRdKbc6VvxPeN0YTx+4}Pd%dFN1)S3-{5UWPNHxM~1J(rq<sH5VlsvgafE~&+7a?hU
zpg8cYs>)n6<5v{{qF}Z@w&(XH68%~t-fG>*r(O8mxV`e>xxaJ*6xlm`^y|~DCjDcc
zoUexQ9(6kdknE<_$Io22ABtktPCGgsJ2FOt!Y2>l-`}P!rtqEQ)}6D&XQ%ZX+^KB-
z-%6zE6Agec0?H0&#iWIMvJOj8-;4#~dv(n<lj{5V*V+nd+?EEY%?=w!PW!7t%zz$I
z{(R<=c6#wvDe2N_N@B}MsqPfLy`??omEGcd?#ve_ekg2LS8^|ti}E9>*tsd&q>`!7
zGb`X5rot;(zV<#zF=A<{d=c6lpihSz$m~=?w9{BhQ->~kO@B>7y%c_vP`r*PKD_av
zkdajNs8hYykN?N=Sc%2%j4My_zejDmZs)Znk&N;s(yMwODZnii_5N9?A>8F#59J8D
z{%mnl+kRM0na0$$Gl(w3a{!T#o<Y^3Wm`WHq@WjD!sKV8N*fbT`=@5$PX1}X#tlz;
zW3Jt)-d6n)0=sTDXXT;$PGH?i$ExbtsE2eUEe}<4{ZF1CTJ<D%;@;kD&G{Z{u0L3>
zejQQ{@O#SF@7s*?I(7Y@83^@+*-C5oxN_!ptwUKk74^y7m&|gHKK6vOo~!2irTtdO
zR%-ld<P;sjm3D7}k2+hOzf}2IJOS13tEs)W1K`PRmEuz4R~t%~+~)<Ku2d4Mo<v)K
zw@Dwt2a4Sup-)Hg^1WxTHosrpoU)&PMhSoXxwWyBt+Zw8vNBnl|8Fv=NB?0U?k0d+
zzjo%m(`sB7k6d~U_{N_71Ex}>K7AT7;IoX?1TTsX6aoJH4@OPwX{{l7{r-xC-R$cC
zq|S}Mx~Uxre<ac1+UmWxC08nGY1|n}xN~e8HS;y5uu1>uooQ`B!Ce|vQKkc`B99&2
zDr?Qvb3yM*jBR6+IXkWHK7B*7i}k8ICA^xKmx6Nfm#H;Bw;!x^vS7zt;D5nWfpq{+
z|9i9{=6jEz5CB*<AmV_gUdOxbV!n&?l}p8=uHc}qt0$E3OW2sz`W@yCSI@)O7qb-=
zHY}#6eYNT8xiRJYzk`N|X>9?R`HvV#{d;q+C%<n?sT=O$$ier<(>6N+&i@WDPCEMk
z3@QIBcDX<MH^Q$0=O*e%2KBdZR4!#bX}GA-=P}zR9E@7ybJ=QKqwPIDDb61=^I<#6
zjFRlw4wEz4TfCCl;`f}Lc5hN%TPB5Dk>wNozr44S4W1KUMj(FO6O}5b3ixu;`7806
zmEYLqG2bHrHWhiD`0}Jzj67Dm)jH?Prukzufd5Vu1c%m6`>-6;nFbxYxy}0LOCiYb
zc8wFf)<E<BTf}KPl+!0%h`y10p5og=sz@;w`flnN&uup!Q)jXs1tjmjqaGz(rb2Gg
z=H^U32Ww(wju<B^86h6G0r5(f4nucr1x5YQLA(eQMXKkW&RVekT0J(QIMBoBODY%j
zC}hpo1zf!3c=BOlruXG1k^O|p-mrHTT*Z$-TEK?DYsWtM$ID-bzo6DgnBrn$&ObuF
zz0O}{iHeIw6$O0;OE9R3=3nui=d`u=(jYs2B;eY|D33#<u2yo>zMVf8i4;2=FVzvL
zb)?&vifC!cSm1nH`ux_O*s=2-FK432RvN;C*@gO;>MjFzzf(}<6Qc+6R+;l}M&}<b
zVYt_I0(V<(2g|NfxN4d|c$7(eTD88S={Xnudc4At{qE|YkQN+e9i}T&(8SEh?`FXj
zq(bv40x5XoAe;&>U8XQnM;xqX@iQNc8SKmc6Vh4hU&nVAAhviPAXDUm*(A;#>a%Dq
zh0M7OG{KaLtofHhs!+P^27rap^V{w8r-}SbX6b!oW-Ye(afyb{MdJ3@?5g}b-;<kO
z6`q8To&_^Jim+fJ32Rp~GK$PhicME@kXia(3I>I_uTjvyC3}rZrl2;FXGncs#PEqX
zMK0aOief32ZXFpp=2{}7R>cZ+GO`b**>R(OfO#NX{L-?@&S14MI{#wMliT!g&xz<M
z$8+i3xIWcEDfvdeNIdV(OxH7`etlTILCxZ8rTR<`t3ejRB*SrBCDgw!f``_flHxwv
z+53JL1CmgSjeYgZs=z1nb*88?>J6*T`_zd>61w#X+D*~_F%9N97WApXOVixMbEO&e
z9(s=_`V6d{n@@F@r`jKXmT4`1t`t5^NC@=XusoBZl@TSl&VsQM>hJZIddBs2ek$%#
z-L%*lDp!^_5Vd!{PM=%<S!U8>e>yV7f1Q9iy>S>Dmal6!Gl8bEZkCB!Z~l>~r~ITq
zHHF=O<S4D(h4q%Z7J#tv`0a9Bl(jA(UE>D>2J&P#iHZKz>*Es!defue?Ug<T`dk0<
zHIw!s-0-RwD*LZbbdy+^0myx$aMPwa{`HCIZ(Ra8?f>~r;gG(&jFm3*b^k(Hs|hZI
zwwxEPDuGA3nq%&k>G=ch@9Hft|E9T3YMVsQqG{_Wfn5e+d9G<vWS#TO`+Mt>Gx#9$
zSiBgaO4l|d=gYsM{ocCl6e)o`k>$nct^mN5)&b=u=3d=)vlgJNavfG~QkyLfN+kZ3
z@AjWP!B*bw+LU1B;*v8qW-LV4R#cEYcn~Yxpo{nDfspew)xGR%t@oe16D(UXR8mm%
z!d~oem4B}vk<=9cWEQUP8vA{G?lb(xy?ZyAPjn$tmgA$_uHd&Vw|zTwk2|M&5==2i
zuu>%fxD}<1nK{$xQ*2h-H^F|dT(D_NL!Z<|tUSAAs0bH6=nEI)f#y!B#f6Jp*O2az
zbY1<aA+0@gE#@-@vf4<uGYP5kL`93KLBRTp`F>OH!^v%Y;CsNGOvD2<HS6nSh8)sl
zljwAF;jdhF@5CO!vXp0ycZnk8)(&hsOdQ%wG=+0s@-JOnBbN7gRL1)+dsDO5RWa5`
z0ok-TiIn(%5O>tZ6jO#7;$&s*9hE5Hs+S#<wbmcJQ~7CXbr>k={AbEm3N1~}E(wXB
zc5l-4x0tB3k-neU*7<r+$2=8_u<Vd<Ugfc!iaXD;yO`uN-*ovak5%ZT0vfnl7W&p{
zb`Cv#On~6IE*nV7^vyFwmR&hV&s~;;V(@_4;P=+QCFnC&wSD?n`-soQ>7^uL6dc^y
z`F=2Khxoz**h(f-7>9O#mO8%sER>2u?5uJ^4N*$HR4viz9yU@3Q%V3FMVjx?_ChY@
znx#kJONzqa`QJU{p9qJJl>XErdquBV$WvXaCrSLW{opL9vg~tVcOg&hRnc{(N$HyV
zJD2&YoXI=S1I%dh<Mad~yj9&D&;^uU<~EMb+pM`@4vI*LtD0_Er(auoMJF5mK*_-Z
z#OE25f1QTwH(r!j^#=z01<V6Wt-L|0Bh78$$by;?QRBo?K>tI~FHvleMQq%dkZ{8z
zljyD_k*4C&bj@iX(F@m~^choRh7@{RLGSBD0QE#AW-ZU4uB5K(OykUO$Z=y2$d;gY
zc9)NPzga?gc;{;hz||@Vi|p$9&^cGN+U_Lxn=NJxrrI5Li&h$3k^=ojkVTKKVITnp
zl<E*}#0Qin6)m=SU^)><HqyfH0Dk@BzF|w5_2WS3kH6~fp|tp`QZymKL4Tx1k40%O
zHosVO2cD;o0Uu;2b(Dmodezw|;jm`~wN1<HB?&gXPN_WeaW&`zfSh`A{&|bT`!OLS
zb%0in(#PNdrNO`Ne~O={$<u886q7P0Z+c&%&_CpFY<LEOO%{+gg*5<t;O;hC?;h_H
zFOM!ydY$Q^-?2I7kGD4^Ke;J7U=RjtEG}u+nztCm1N7$3waft?RktGzsS@g)2L#VI
zzm%`VyBg6&Ot5O<kn-CVPHL?MSRweTHCcQppg<jsf?kQ4&&7P*B2@?AWtQ4^PSc~c
z<^cE2Ct%kU%Mvl5UOi?~2-G$Mx&n0l0h<P27nSBVN(g!l8Z4=NjsOts5i5=AuqFGa
z_n%XpTYKZi4W-wz(i*+^M9id=a6T7))grTXi^06<xbm}ucP-*aUuxj}Ky4V1wM{vo
zy3iK0mLh3p(j37UplrV50*v=@p(+WQJP`_}M^`s*+_<{(J|Fr1j~xRWDR{|b?FXIc
z)OA1lP}X#}n{rQXw!7K0&J@2V6QISDd-KHTVTd-_18#AiJ5P3$#53G3HN|%jFHOT)
zW#@0Erl$vI;Bt8OUY;FH%507HZuWO4eY0q~FovbBZjO~A4hkAhg+@lOtD6}LfA1dR
zq`lhe6Eunt?}lh2bhfLjY{m{*%pF$-%?FEnL?a`DmL$2%!9B_QN+fJ?nm-Y!Bj@`&
zBM?RAxEgPa_m7C6S87(@NTpzm!y3#BmzkR`_sgrmx^ZzeobzpiHB6+6$WAF<t<av(
zl<{81Zw(oGB@?F6PQlq|Z#g?o?3evd`4#etiDA&5q<&rmU-<%9*L5ZZbs17>ZnYv*
zgSxCOReFz8>B*UM;ex!r>cL>erp{!I*<2ym&GIO5aq5+sh_R-18Zf1x%k_O^-8n8I
zwUi(x8;zJe6j0%4*H%Qfy>{VVMeNoz-YhrsD_fgZ(%Y@EZSszg2DzW<#l`uUiowSe
z6{iuSiXfyk=%OZ^RFN4mN~1U(r{q;lu(fV9<jC3gczv+}Yj^qle|P$@GO8^(jLC4F
zxtG2XHz!!XhUGtBp{K#Lt4+Jf+kDOj1rQ6oM{f6T3UE%-^|gz(*m318t%z_^Nr0%B
z6`Q=PH*Au1LQCUnLSoj9hP^QxYs!=@TrGBuih*TRxoWkkcA@M&Hs$7?CIG7{J-=5i
zfZaK3_K^UG_y8G!U^*S?*An;-I;LoKT-1qNDghlIu$WjrndH$u-6#Zu=G)$SRaYq|
zn;m6rvO_?SZXy?Amw6iY0F-b<12h0N;vZs;#zAgEr+4*iyO3ix<)uFQ9U)AlJrAqQ
zOstU6A*D658%9(dJ%bxyGa+naA$a57sV(r+rg0e=b2Fvp+zAB*1ti{AMoTI*G%DO2
z30x0evS*c*nb#B+7GxKH?U~`aO@l<70t^|fDQ)ajkx*Xbg0Wy@tKbT-f2+ySYABsB
zWF}~unm`ZMnCt3IUJD7Jivz6cW}d;JvlB~3R>SdwbOdij50M&9W#2%Gj`N{&J8b4#
z3Y%cybkb*Z!`KYieP2L?Z91GE#)dFKdKzwTtskm-aVjb{m2VsZGI=4EfU@D;s73nd
z^OYCH$3Z)<H5deL1r+4jk{m-19-w4*QU`MNjmlpj3>#$?6cw|wvKTXqMu!=*GBRF_
zu8tdZ_e=_R`XFo(y*kg-Llr|?r7VNwNJv5gG_*7nnpC{aFKP@^B)ks*re%Xc?oG$D
zJ&u^YnC!B==Xd>@l;UQN?!MMwT3C2&YL-jupDY8YP+WF4xJMYUD}XzPYkTO=NtViA
zTIO1|2k-{vNUTY#->U0A$vh4J42IjyuUoAgWtOVM@R!n2;0`uh@fXH@%hOLHsyExm
zq8#;wbYAPlZcUNccE8<K+gL@_J{8jL3aQOp<v;PAe8>mBQ47e`!%Ekc1FR3Ikziw`
zr?QhBV@2|ZvLy4F6CY9Vv5!uJL4hA}1&o8~<2$$<eD`aHotZpUt_a$f5v|P`5}kN3
z@h$87{(6~}f|?NDOd<MORA=4#*yH(?v|m-5PB`wSSa{o29e(0#9PoMi67}-~Kw?Ez
z6_}C*fDV|><Y>}o7AYS&Nf4jZ-5v|?5;UT49nr=0*GJK8o74NtoP3@}JdQ&C*<*LU
zFZ?uqq8{4th4LT7MKVAzxl9m1N&Wzdc85{bB0K41a~_tqj~*c1y*M9z07gu7xv#JG
z7oL>bUS$aMRD}0`2~!O~8N69aCi-v#i~hz<+~+rL{ZDUwZruz(rQL{<dHhcgUw>)A
z4_L*-mFJ}LPrm;5Nu@sCXxUW#5MLT}x!p=w!FX&lR#WV}{Od8O@-^b0UzmP|6Sy)5
z1<Doe%}pr2Z|^n=qI3RG#mVg|?siyDVYb=mUU4!Y7z60>=mg^ZZw7a>$@#Y$I;>41
z>qJlQNor#p`=CNUF}|scosp7y{lXhxHLV`$|4;P&$HjlJ(SIm|-=()O$!KWM^8jCl
zZGV1RJIx5}LwCJ@g*m)!{yPI=wpM)FeQ`96u}wRjk=gB3@Bd5yhtPA2AAPO7$Ynk!
zGalRJ^yl_Du24!jNcTGJv!pb4$gCFnI_rHH1FV}@@J!A|$3Zfysy5h3dxU;To~}Nt
zU-_*MlwT*TOrMT?GNRg#ei9V%)%fB_rCLO(avwP+Ty8dJ<E4K}0IBsj?QY{!;Q%|O
zxSIZouFVFQh@Gg%Av!`zd6xm*b1<=@nzqx&u#;Y+JEX^_sI(CkJP<_|fTI37U)~w@
zg(cNXPepP?_N4VS%kbVzE1^`h;nBl5CC{~pF|$5_HPs;d4wz++#FcAWxcHnsrEkA(
zm$&waf?}W{`0F(iba!`W<*`<(wP|W<zSY%bvVq!iW6Z(HMazBDu>-1cEzvKYvf2v@
zCBD&DXAha#0?hkuC_K)`#$U+vx6)Hi_C7Z=C{(k08T1c`5Z9XoV9Kb`E>+-Vs6tp)
zI#1>E*BUIcS8@lGkC85@j@jajP1slz{`#FHK7P)(ROgDp27Deb6dc9|ApoKSn7jjC
z5o$yUj%qVsvmj}$k;*@=krV8MayTQ3YxJ)E%h=q{RsoAwL~grm)dPMB;MWd#BI+Qv
z7AWn?1BfTW+AFrzAm1<Q*=P&j5Of?!QD1epU;8R%cJ5BWJX8X=s8}yQE9u&581(%`
zq+2$lc+yEQ*3BhG_&ZCpp-N-iu<pGBeFOQc*RNlPo#*Gjex<Bj?YuesTf}F5c*tzi
z)hRojRsCggzXq7T2nuQXsPxFE-V`~wMM16<Z(d;lU}(yoAj{(~uU_dYQ&CQtr&q!O
z<b){!$lnXP%qAnZJZyb|RV%2*Za7)QK7S{fmWfG<Q2gv2Z0{w{+gkI-4@2P+@Pp_x
zt_Bt>e!cSlQFkH^VnfW6btV@@w*YSm0EU6<lw<%C1Ox^=Ts9bp3;uW|!A6v)9SC;3
zS_?S#LsM@I4a#$Ao~6a^zQRF_s$}dp_$FoQ39u<!y}PF;+KAe_cW1Y^a^UqAr!N=q
zWKD{42PuPT+3RGf9Y||>erH|y*}3FepReNC;YJKn@?xDICV8RhzLOo_T9x8L&3M}{
zpH^`Ced~hc&V!WBqjm~V+)}Eq8cDN#i;q5psflWb3g*~p$eCz*6ow5_gu8&}bAP%4
zeT{#@wtfekDYsWVcPq_J49$vi_#Pk8L0$I+P5{@?>O>b`QN!LN<UV*$>#vAzZH~z&
z;hLk=S8X~^xolv;wB^Mmd2u#}31r^NK8KX`(CyY2yEb83);6*hsNEc=A|SlFcK@Jx
z<RHWi4lXKH;sC-u!7+ECJDl$NlZy@WhmSej&#aNxR;j;x_*cL<yD{x_)(wO|ob$*E
zx;1vl60>*|36YDFM#AqrBz&t5=<C{y|3<;CRrI;9c8blQ=_plfA>H5iiD5$#ODW>q
zYp^GX4#v!q;uUIJ**EIAg>q#aIta9pzqlM<I677+sQ0q$Pi8u!b9?1gYyVw6x7vI_
z!X*Z|RVOwdpQ|gVG__qX<b@E-1Hj+t2ayZvVHMyA00(g`Q~*eX5Z>k{*B+?8AI|%}
z3px1T+I#P)rq;b{bQc>cC?X=#6a=IzDoD3bq)U?;A_7VgkQStGsR9Dhr7OKi6%rs6
z0i_B^FCm2937v#~pM|=`eUA4%=Z-tRF}^Y0{}?f5mFHLHZ_fFw#W#1p%6#h(6ZQ=$
z)PUu&mY;6!L0^B0*F{(EYL>`xZswIQ1;C@1%;@y^rI;P?#ABmK%zUVdqJXBt4Rf2x
zPZheGDB3j)Q?Sal<MbubPJDK8!po!AdTrX}tDKeT2+g|#Va_hLH;cB@l%(p)H)rWy
ze#i>j#K)gIS}@mF7;+e2q3y6XNseD0Q-{~*I(vKb7-94_=SC+JB^x9w(+0ZXu6I~;
zc$LDrVdwC6vy+KqFWVJJx}%rl$0WRHL<wFk-G@5cEE<oUt;z-!z;+;?lMAYYvK2#f
zH2`1#v~($S;ywO2{`0dn#vNG`Za#*wgid6RSr|x&z2Mi>f`WezS+gGEmK&Xz-w}~I
zCEIa`l=eJod%5O|pBUUSS;u*9)v7BpwQ)Z195a=Ck*ay=dVHno@rgq!ytHTV@0ZOT
z>uVWY83{PYh$m%gxXWA))R=j)-K-d~omqnblRqu(X4z63-A{-xvJ>M(@QOpo84IGf
zj^N_a-rUVYOAGD<X>T$Pc=MXo<*@1@DO%0PRC@gN`RQRgHeZ~~?t!Z-{p-T)BXyfx
zPT59<(0?p0IkfJhX2#KolY0CE7Ab+W5SBj10`81DrW~mTO5<J`G&J5TgP3y@ibt!=
z1Hh|$hUX1t;P{hq+uOTMp>1u-y{7Toqh$oqSGB1k7sW8|B1%`5Y}T=LiSATMq@=o`
z2!E&5&fC2%9~3Huk#nP2)H%|YN?4Ehihh>|H#XMNS?Q$%8vOGqNeUO!X%vKw-w6xO
zSqkiyT2~3!CORj!xRb5>moC;s%Y8ceyK&89Zb73TvHPAwP$N9qkhOugoNL<)MS}y=
z69kHnpv{ki0jEG-=mi)>1ly$o+S9aK4pKA<&I6>6VFv{b8V&&1nyuYvz?k_jvjV*C
zZD{}DmUlz6MbmL9oO$lfMm}tpPGX|Sc^l3nd+XM7RaMoxGi4|;5!FTYiB=K3M~K0E
z+1jg2RycLaOu<p1<7a8JXPiotnVDCul2io58)pePvQL9XzTQF>yQ!0^$4Mg=C*T)R
z0|=oi^E;RQomwOgH~k%!<_L+y&<Tla)}WGc3y2W_NB6q6Ubp`(Foz+H4}*CG_GqKd
z@|^8V@q>q&6VPy^ZCDS!2<kJKH@7w5_UJ6jouu=#<GGwUQBMAH8#4w1%P&=uO}n#)
zWLwWEq(1$e$6BYND8^xjwagS=?`XGbZ$dRNQ^7BJ(>vXpT;F8)94<oGQ7anAe2k?n
zS>#mf?(k6IpG2k;uyg@yb67&ekZ{Qfk*7IZ354)PZ1pM!%eLAMV%7Etnk;gKq<Hep
zdfywZ4Kw@S@ANcfPd)(W6?>_Xh+F~i!wFPAs2YM-Z2TxKrL}Sl0t$)dB2;pmGo?95
zXR}ODHup+oW7}SdL|t!=hj2>xnCrmn3l*ZHC|;Y%2U7)WeOB|%Dq}Sja8{wixWut+
zM|{}T7D1_+m}fD<JH!xP$7b)Pt@ny`k~HRL@ycpy%+Y48tU9hExOT(24+<)c7AF|k
za!NO%<VqeU%vRvaoAE)fKR341UNfe!YQ42wc&l&)v-F2oZZxd55)=#}B>)Q`I6(xc
z1nQTPJ+@!5R^KfT>@)93QL7k9tONIJjV^n**=FB;%_Z<fFeZW+73)$TFgJ}6V*_A<
zv$5z>=JGf<tVDHSeg3$ywr<?Y^m0qZt6T1NB&kLk1(VSWo{s@=RJB59i>nCgh}bJ%
zmcO%2<4(zOzm7HD<%~k*m&DqXA<GDui>Hp=wwOWBfMWwLI|H}AH6CqYkop$wU4DMH
ztGa(O;-_-ZWuaYgo7hJU`ahI1U;+YN06Iyi=^sJ&n(1?ad#<asAs-8`otgnT1f>(m
zsuc_<3!vToT>*95oyO*LMwc%AuE$^NN$nq?#_x4}K*_v(@lb6dme9{io1RG%K*Syq
znD4h-T`S)4a;;0I$T^a#Su}!-PF9SEdtlTqiCXs;FD)>&Pxrd4!gJ~^BwrpU2v}_O
z@(%NR%P1`{A{ktW7hYErPAo00s8^XCL0|BCwC$Zc^RNLVGpOZ%C(U|a>+^5<zjr0y
z^IyaDi^tllf7gb0UXSd@!mv+_uD~pBtrL#ISw_S-<JaF(QN_7tza-A-1xU5Vph|}3
zyWw1De7<#=Gnizz7CWwvR(jKuwDZrFKew6blHb`}6B?@1rXzL2iP+V(xF9u`it5$j
z9IlZzYD5@{Fq!A`IcgO_bOv*R7mw|o9{FJtD`qOjlpN9w0Q{*gdthgM$v`LW^~wK7
zW7_Lk0JXN0G0xTqHLnDXT$}E)uKbwa4B$mKvLP6BFsD@v2vMjLBeX}hq;K^!S!%kh
zwASV~;vKzpKTb6JqgOXv2VS|Kpd)8#idl?;MyzrHot$^?LMvd_vBHG@V@qp7yRzmu
zeFAK(Lq#DxPGq`5L;lm?j75<Wy~8NE{e0Pps%;@#Ep6_SLE-huk-)JfF~wkt02(^_
z=xbdceGRKWlEyn$Pnf!!OrgdOf?X>9w;Ba4KnVa;$xl`7Zy>&RNfy*r7ane$a|dOt
zH%_C^i=PQGVy5;f|7b7pf9d!^SJf5!%zgp`=%Mm3qgU~t{3?#6s%co1*(L+>p`Mmo
ztKe=%My6qzZFiWPn;Q#35mj9!;pfgq=j&ckWrMyJm2FMd-PI)nxR==Nny=If6>;K;
z$^F}A@>w?U_h<-lzpqHf?IUL7GJX&<6<lC;H>l#EFs$^=NqUoO_&hjG;coZRszLu>
z?Q{c&<D7FpuRlcIZItut@LiehlEtGZ>1&by|ANHjw9D49VPljWqnJ;!Nd*N-nr>G8
zxTq)(s5NQPVPx$!qlqa`w?CbLhjYZob9zb~R6e<7n14Vk?_$O&tEE?0@>K$FHNOpa
zaotbOOpN+poJ^Z;@RgbBPS1IVLuS5Dg|Kj`=q_ooeb;F=PVVEov_}3HJ6KGTQ}QLh
zPhY*ut?H@u(EKGn@<8Pgm@!HUNrGf06<_IX&qz+zDn6J(<ybzf|JePt{L{>U!4^Qs
zCfk9pEv*<|<a`7)<8M?}={H8`8Jf`lwLue+P=gk7*^RZBIf7olpCHg2$fqF23FB6)
zyxT4p9(<FilL)g11WSG*zq86?kxTI|%bKAb?^^u32JU$gdU=x5XsB~nv}ww}^D+wE
z?^?*1=aL_L%R^+z?@)Pb_3H^?5MzqxiDb|->6+M>LpR`~XM>eH{Ew#<IkqRF>SpaL
z>#)bezm4E>Y}1mDIJY5kHIjG^ux!;r8U7q%e*@>7mt{sxUuSS7lI*R5Q9v+$C9g05
z_yexRi_pNwuC=_^9BNQ|%|R(<0s}^=@~}(m&woX@EX4sfWq|4mwZ|{N;Sav?f9f|Z
z5m$}Y?@PgPrA8p#X+Cn{62KS%jg2ZiSj3lLA44ZFR|9ZuuZ_%uxTX~UCUb2=P!5pk
zLLb2>ocFFZTL+MZMVDRV@}4MijsO}iNO=MVfX{90b35xk4M46I%!Qk~K#)dCAp1=5
zm!rhFVP@s~_gN$)JgL`JK~oP4Q_H_!yT&GD?C?A?&nP7{JWNJU?-4|+O6+dfPIJtl
z=B9~bnK<@Po%JmPHcqxsw?A05{aHG?I%F7$LiTlMd(&&rKZeiU#0s1Go(?-BeM|3A
z4IolmE0mli>yR*%<rD1<z!X4yI@C4+MTaZj05lE2WoBRy1mH{`_8cn1(1rORIG0z;
zE4v*4dv7a>-Xn~m|LbK3Kpi>DUds$TdbL|q6CwpJe<cNU_LBlTo(J0vBRM062dOr~
zIeo-$H<<L*0eU#L+IbahX#P$ZTphap$31P1wzBO*yvD>aCFLb+s6g#3@g(QoxJoX<
zdoMaIjN7a$%<@l#z~JC`s0ss?+SwnBJ%CaLbB_zaS-~hn8q+C281-qO=Jf%Z#B|UN
zU!1--KH}`2v)a~XG3|tyDIF{9;Z@j^0&47Rw(DvEIq1aMNjo<6ZS;0+>y6-sv0zKy
zjr2Twh96PxLVlKRx%l>>rspiiS#jbdd|Py|=8hYAAs2-%(~;|8B*nXF=)|1*mXY|g
z9G?uiC|a4AIw?D?n&?9ka_SYq8IAy9pd4x&kdOir2c%a$Cf^@mvNk@mcNjt*lvdMZ
zmcg_44som_aD%301uM~l@mN6%AOXDmN?I?{Rk)0P>l<Xt`n_*9`X)6u%-F&;5DA>y
z$i1I1L<k)R$ZoGqL42t3-$!|Zz_3G<tUUID!Z1qk2pYoPQvlz|%3?a!XS?hn=^=(_
zLNn0oZ-M&s8G@->Y>hD!AM<am7PbP4PMI?gKzcx*K=-wA7IBsn%>B^pxyNK9zu)?v
zSuk@M8XHHK+==;U@vP0~b@&`eAAO9!#dK*S0L^Ja3+4(mrqu4?$PxQS6c8kwI9h4P
zYx7TSI0ONB_Rr&d`A?2xdlCU5iS{cH(~nGF?#)^b?|#^LV~_Es!I}F-LU<L>hypD>
zhVIj*iH|{?XgmY}Wd*Yr>=C_lmo-2E(*%GYl0X1~&DYfi5LiK8FM#olZEbwE-Zy-3
z3rQ4LxG)rr#2O?GuERb8pyzvbgV-3pF5W|2X0^-V-^=^wKttx0RYv`PJ<c027yXaN
znf^Mnr|LtTwwcPrd+iCXoKNAFdrBF9Irhv|2;?oNa$3hxG#={gmTUnhoA)uF!ti_D
zdXLe|1@tJ81TbHvyT23sJ?6e9q(Xp*J5@0x&H7La$Xbj3X8h&p%iN%^y~Te(3z)q#
zJg(IjFu{fEB1bG|iCe#BXq1_pk*N9C<J@}x9~`F>?2`ktt77d(fXe$)njfQ@wRQdW
zQUhogPH3)2d()nx=D09xIB7<Xe;i1chdy8=1_uO<HAVLks`>#nZjayrOdgOdxiA_~
z`nT6SLS^N1LV*m@-K9E2;bXzK66~b%&k{`6qFtWFG&`>CGk#etJnT!i-^+hJj{Bqk
z;5eD?UuC-hAHy<`SFtVTv8d8Bdv$3j7E45Ef8N8c@%f+a6*y^B;WQ%PWIvq(3<fwL
z;A`c}KAU@2g5d?k7Kk%QQ~9^eWy^~-_JuJ(lQlp=C8ji^0mb71)UNS@yznbV#zJu@
zCvB;oCe*1WJr_=nw>ebQ|9YImP5;4h?jP3Uho)CLNH8+~m+~`*e7(mKi5W&N$8hQt
zX!!a<ko3$tG>#S)7Pb|uNKFtSn%6ghQdy&i7t^WM*>=Cd@M*;J05kYDz0m5lNVGxR
z>C-nf{{dEaJ=9qm+$iCoTQ$C9&7f#2bP}QFAGCo`=U&L~QIp^vEzV^^%*d!&Zw-{E
z(R^KVn;L+S+{;bD@bzcEDxEN~r9}!oeg@g=QubOu>wQc-CMKtpm6R@gXZiKT;C%2$
zoKb9_m_H50zrVvo0{Rv^2YWI+wLISilieIwzOg;*4PGe^NdXCeupQaq)%;^y=ad?W
zz_$)O@uhpB;sSq56r<-S&#%8x=%baM{x0Zy8(srx3ALd)Nb~>|hqoL+M!=Jl{vFgM
z&J25Tk3Y%Um-o4Q^ALO{IT`mawOZ<RUE%=`tT6lM&I=rUX*;<##i|FH46bU*{85SU
zM~p!lTL7Pvb@}ey@*J&G%-3h$-;s8l>eXw9WWEpT6>66w1!r!puSB;byt_7I{Y}S_
z1;Fr70n_SeZA;yR?6{P4(}qrkvwE*{2uyhoZ2k{j?TJm8&bskluZRs>B+puhwE1uH
zx$ksXe8+kiCy?hrtq~7Zcd2q@_5(Q6CwZ=J*J)E6ie_f9Uujr32Pkg#G;K1nxc~AS
z<>cTS|MPEzFzzg6<``6N9c)8c#0%Gx_x@5LYy-b2FI97S8}rF;?5#J0+0t<|URbpY
zUZEYb>Abs5XhY%FhFn6jUtijsM_Gi_=KlE$t?~RI50Lz5L$R|03=MckeEVpm#pZ-O
zuhD~D7Q*H@#=<b#?6Ais%xcloYO?b1b^Di{WZ@QEg-)3zITpK4E1kwxUvd2VtL$z2
zl{Ckg{aQMX(**P}5+pVQnp#1vglfzlSB2aYQXvWVoO`(8)Zc&}2u(8qIdX$@YrPMK
z0sUz4Wa5McKkIrBpoZP8ULHd~j<Yn;I<a<4av&RpFEK{d@|O|@HhJv^gsBB>UYw?)
z{KRi)2IIL5#l1wbgz`O&SFQFxfzJT7TXPK)tg?F2Z%-RM(lRkMVJ6>-6*hP|+oAtT
zUt1{b>KQ=A<}0&ta@rvI!|%b=xHh_TRN$HwX6ldC%Z@mqpZSD_g-I(Z0Z^Qgk(8e=
z^IfG!s&$AgZ&?05^FYN*F6n*}-vz7sNfNeCFbMU07ouz4K%JupfzjCev=>s1U+!^|
zkkGLQn7YpvaLWEI7lpfQYS}p%{$W9&Kgj}mBe4dtvw%1dCM*L2?3P}QCpK`RH2TjI
zPZR`(!hCpL*CUiQVj};dwpaNXu<EDAu~=6`a~zb2WPfeTV)EyO_l}#S25k$CA$*Bp
zKeVyLq?e);J|3Z+1woatLxQzjIt4dQCL9CQz{lRM7!NQYcXX)ALbE@1pC)$q4@32&
z$0%JZoCM(p5^5+&h|~ku1EDOg$Oo7`It+Ze36+{XRR;+;^RKQ2{V(~Pf6Is38*`@E
z#V`^ekllP;1X>LZX1y9iF0zO94|_(Y=Wecc`xz{CcFO>nYRqFqvayUHcD_Bef>H2b
zb*#z`wXavVF2PQ7VJyOG_KK8jcQ(xG6-Ur_Y%Im(oyn0g7A3+W0S}4a6Shtj8M;{-
zB>fP!)))F~li!(XE;-766SaU%Y5QSiw_dRT4ewoz5}Qbynfw52@%SL^!?#i3No}{y
z{OjIn57-3cK`;O!o57_)_yuX;W`^=F-1~G6Oa@>I+q-V?=U3(DR%8B3=hwS6Y6gaU
z+gf!Npq>7%_jd+Jt?U(8+S89xs_?AwPV9H=uvbqW!PF1N9;z>>jl1ixjmKDc1+Jg?
zrU%J6KFfHL_i4O-u2(0ov`)j<q#VIXj(}M<?CED+bZ{Z2aJk$$@W;r<{Jj~>Jv4cf
zDbr9BQ25{C56aC_u1Mn7=u=m9_W{_sJTF$P^nJR&;ie9tI9cdpa+1N@|E6D41cvMg
zJz+Rn;_T8Y^cr1w7wl^noD!qXo5|PvnB9007IS{~5h206*Z313FdU7iIu2JU+vL8y
z1-G~fMp__EqjIhoX@)~nAru_Ei-mY%!+`<wU7EjxK7g>h45?y=na@!ncAqW14yB(=
z!@%r%1^UnU_jK|^z!7=0HiJ(m&U(NO`-Hqw$XzbfuYUnkkI6p`2O#a1H5g64UbRqG
z_}8^a;-t=_ng1<0y15=)_PYpx@|wYv3B>NbWoR~M=;c+&oeO7{%Wu3mAl3j43$&p|
zIz94s8)byPJK1qghD8G0v*jW)q{hH&VGT4f_m9%xMI^6|Fd<+pQ^N;<d5KE5F+dmz
zB!}zq<X^|0k2f1>PKp<98SDE{s2ddkjuNO6U?}VL&i$ShP;}@8V`q{LH6IG04X4(g
z?I|mV4XLRRwg=2JlC@FUyl-~NhEneK%yk%>t+$xAtIRd49%oDMP?TfsS?|j;_?XS1
zpb0s?rrs1&*+O*()K@y$#x(%Q4Ua2_zc5)GP!tRr`0uWL`&lzu-r=uYj)!a+nut*@
z8dLBv;h21g-nP-g`js$KJVD#m=4a&>nEmJV4S1)5xJC|O%r&bnqUEAa4+swcI{dJw
zcWyMjgRMlN&U<g5P<@N!_cW~GSMH{EmZfR)RwA|SoaQvNkkD+a|0>@`Y97oMIi<jm
zx0hKUuIfQ9{<{S&J36*|23pVyRpt(pN6_5SHi1fvvn9i!$wU+5XoXBiB@~ptcw%2(
z!RbQ)9@m^V^Z_!MbkfWnBFK-`HZY0WgE``Ry!Os9Y1e?3m+v8si2S%IwT=t`t?QIT
zkNgQby>7!0d<r0PDO2}+g!}GQcR+H^?U&GsWY_5feq#yBf=2M;<$E3i$UX><{2+vO
zHfX#7t~dO0JvW8Aas8f>6UzMU<Y_!$5z^d02V9oSSLPS->1N~El~tBX<<UIgiLrox
zExB{1khTYWFJBAp4!@iZ3z);^wub2DclRh_GMN>y#VH(yz-fbrAhKGtY$=A&1I;-b
zXwPVy=>p`|MBx-0c-6NJ|N0ZWaOB#8YVSk8CKbGXtdV_C-sw)TG`tU?ONRWLhS<fz
zs}JkJDq|M`;rA60+|_)fo<#Us0C*rBZvQ#Klt}+B0LZRtD`N&d{)m<3*?tP$$V<oW
zJ24;hJjm6cnIL!p*4P~a$Qio;hVL-H;Bx^)OA)T48<U12gphEJ%P@A|`*-#9-oDQg
zAo(#IG~<6*3-`J@5_w<HZhEpubYa%ru$k(;gjSuniG%}UhM54f3Dk#Jhi`Tc7H9(6
zLpgk1d!K#{!#&p!l+zGH`F%0Jb_GDfd|ggV*<p{rYbsqU6J%ZZ%1ZBt?r@f!e^A8&
zEC0etm!$o~Nyqa<^FTOeICyxWrT1-+hdASfFv_sD?>MIA2kk8`BO?<t=g-{nv*QpA
zIi>^vntA?;{z=1epR}JWe?M6!^}j&F{S)BY*aLr0_UN!Z=L=*G0?x+*XhlIrezWib
z!pu2KsGRpX%JIYz3P4{t=?l3&6H1VxX9mQil3q5MX6v!0Zya)bkkAZx<Qdu`Ulwxy
zB~|rxXr5?D#W|e;W5mysg0;ZJX5i>%2D6g#dr_g#f`~XeK6z+{Sb4Zm-8QC7`Es_&
zfQ`gs{CZzl>S<dhp<kQ+{taLYFxhBO{4XKfe3)~g5h)9~Pgp#ZRADiR*Wr=kJO6ib
z(}<5$VosVV%?|fOx5wYV<SlINqiI+W-K<v-Ig~8Y+>KiL$z-=2ZgMAw)S*78TCyQ`
z$1$~!HboQo1dwAiMqG`-B_m$N02~2B6b@>{z#=whs;RZ)<%5X>cmtFQXl#J`@dCnL
z#qNQ!vNES>0Y}7AJ|Fi>1{J3)p^qr-q;kL@LB1jFlDz?eVXR1N^fpa^1r<+Fem*Z7
zJNxIl)Qk-F^mp%q3k8vi_Rl+L2zyEnv#0XCS3$<<S?OWo3wA)s0T|sZ6q>h_4U?5M
zUPt0UX-IJ07F-Qm#UN~H-y0;{9t6@%$RD->cUY7;l=s}P9-+h8kehc#zP;&v3b3s!
zeGtAn=ripxiAxh@GQebGZdg9l4DX;rRht12Z21tlg0ulQ28etxiIzgGz4U9wDCW-T
zwsX!fm%;`*=w2I1m8UzZ!)M4AAvX<VCd#oK?)R8b`lHI6p7K%l`~0V^!#8cXUIhmS
zpD9*W33(M2Wir*Do@l+*lb%}NKR+&WOX-oDmO&cdNnSJxcN6%Wg=J)1%5xu-aE6R2
z({3&G1vCF}zgZVChy2+hsxj_F{<6c2I{0QU<y3E0M893DNC5EJIu(lSn=6P6m09u~
zG7)?;4Mo4FN=es)oJhhK0e<z{YMO=pSWRg}&N4*AV)8{Qk&g23zc1%0+d&$%-D)BJ
zBo5dZps{@O9IFzx>Hn1ozX37cLBU)U9gO<>81HZU34(Fj`O10kZm-Rir&^~mhlnzv
z$UMv^LaCWMx?X%P8Izwl3rzTZqB}l$$~s-Vi(-H1z?8VUXRokrL~Vg_YdQb}=&d(k
zW&yJ4eZVmTQ6fB<+2XYUVNY`f(<>-(-Pal&NGu}wZ4a~5lR4!E;|DssOYS(K_o5e!
zEioTw%=dA7{@!CvXlV1mStH1pAI`53ZYYhl6fy!m1GvHf83E)jNIEbyuBTx+f?hO#
z#O>07e3I!@Xr{>n&>#qwuX4icB4>H1o3J%*vB?g9<Z67zz_O1Ot*Krb$95lk{f`6j
zO#kvgELG-v_6o^)%`VwSQ+H6DF&eK8P{6$i((xn85%&OMPC#}!cJ3KQzA^E7`K9)R
zLcRRce}c)t1hZ6ApU;^tWDeN9L(m2d3kX?SG!oYeIl1hsFQOCN|6PQCv?#G&)DJK$
zyI77T?#Tx5k&C)^d*B`?bIp4_@5yUUivee|*PM_&4oI4%mVjLaYXo@STR{8+TN1Xx
zz68Kn0ki$UWx(s&T?IIP&vq453)o#<8gL7HYXFi2UcyqYZI*KE<{^m70y1NNCSpI&
z8}i?*Q7<JOM8qQv9o@_bQI9lvhUS)1@E<O^w8#1}Sc4RXauyQpKtL~+MDJtbs}1az
z@ut-VY=^Y=%AkLUp{BB3KUviG#Mxg4Nx+B{UH<~wEwQTeLKwizrM^MHlJK2j0k#t7
zF<_iooEzYWct<2C4!VVVlYwgk?}WgAdF$%Gx{CfKyceVKI$N*xHF<o1iIEF(UUuK`
z>BjEkd1+W0qwS!5C0Bqr3Bt!Bh7+pmh%cP_U%-^P4YtGpW#**?ys<5qUk->PSUJhB
zCcxXHkVMjb2v8izyvz0GK*|P~z{i46UI_^y&i)jHjM#l*$$xe0q`z9fz~mA408^F%
zqWc-TG+pSj56)&{xR$ojK^mm%o`O_fBVCFg-zR5X)*L9^1Y1~qpF>s8%zngRuX+P2
z{#*6l1mpSl>J45PHUEhB;T~O0#TW<(_)<QQ5c&R|(tz86+iP#gJD~}r5X}ziLXrC1
zek%UIx^?+`#ymhAtR2AMuQ%oER$<2EvCpNqQiQ0)#({h`41}$3u{~_d|94r4_w+j>
ztE6PPpx(pC1GdW~eFL?$Vu)#DUb}i>$Uy#&-7vdAEKN=@@;rS8`FVai!^D_ljJK%q
zW-ao2i@2hl<Oy+G->Dw3vt_Y!Z6A65*FN&x8;DFG#@9Z6FAhkcr2Hrj-S%Jc)ISzV
zaLFHw-q5mp0oi9keuJG=A!+z=$QvyhZW6FmQ2NkwkA({lhb-Wdy8nQ#wdMcZ0&|li
zTwLw80zI!JV){y*z{;}WvSCd^q_U1O?T&!ZwcuBGFDB(DD1Vo?XN~Jeznd{UY6c4;
zFOXB(no=-Eyo@_vy)i#W+}mcA)8cvu^3osmJ60`rSc{3|U+DG!4_&1%$YT1RJ>>@f
zkbNlFD<kDuENCD>^NJyyJ0j!3X;T(i>GK)ct=YoBmeJcvL;SuIMh3VpBuy<YRd3El
zK&}g;k!!yI#+;F9=b!z`kparPwnbdr7Lj`0sebE-%6rjn3!EAPXArT++CycZd<+2F
z@2yO2Un}Fl1Q|7Tmw-tY@GW!_0{}TYkjz8)cUnRG;TWsj{rneQ0L6tGs=5KI$G1fe
zOOAq@0*O>DZuHPUx5s?nK4Nt6z)6JmtqUO%zuE+IzTyZNBh>AKX@2#MH<TxD_Lv>?
zlsogQy*AIc7{LvPk4c+<Kkh$S`RDg<{-%ebJk6{5Yx{^Fu#dQeu@?W*f}-_1pyBV|
zt1}?~)#cXl{PDjxWWUDpfBJ^BQxJ!|lk-axZVMJz@R;?5rr?6OP8xY0U}wKy=g9Cm
zXh3W?@-!8d_ksKG(n9AWI7upUIxU-Gl%&VBn`4GP?mu@8e-dD^X*?ktAuI7EA}1@$
ztfSq{?GLtNc>iuAb#7*6Tf%St^a~?3pTcmBQnI4qIpI8^8GX}|C)n67h1)g?HKxq*
z2L&Y4ox}2%FSgH5G`x=&=CR;$QV&<>3AC{4YV>PNwwvHGnDF<mlcXyV!n8AgUf;N5
zPn<L6)yE&#)GFr0n(H~B+mLNJj$*wi!a$pKEWJM-^K?Xrp@In|Vu>!jHe;xn|3tdF
zX|)_>fzd_GUcF0(8$sodv1oT;YN$YNo%(aBZ^oj5>R5TGi}v<yzUgw8Oh&7bEW3JZ
zo^nRVIZ;&?$AyLaVRpR7o~Im%vFh?%8dE=3jT{PO-4X5I##xjytHT^a0Dm4QS8AlA
z!txoJy3{mlaMtUG5zC130KNSdb$UidFcvYuc9IV>E)f^O1;5}|q0N|_%&e@TaS?cy
z{Kqp>ST6X8`>Wo+FI{^bBa2z$^T+4VOmN4tS~xEwPanShRPRAWZtkM>#Z#36Zp*5N
z-Inj062kFwd`3&OIZiuKa`v0tz>^p1R^_&kljjaLKPI?>8SdqzbJ}qY*UcKl36#ik
zrM1<nZ1+L?OD9{c4>0(1y_L+KNJ|f+KnUMQ^gc1tN3){jou_`Mb{$#2MeibKGAz85
zcm^JQQeZc2k=LnqI|SL5<wRUe<(-+ct8Q|f<5O*Dh~ln|fUl!Cbyob}VTwbJ_v>M7
zQl#Nc;0|X$Iv9M+j(ca>U>)c9e(b~cTKLc=KJplq6{7iW57xT-0`KsbKdr_Ov+6n@
zDP6`Nt_-BRYEV5W6#(<b7j4|=`a|)I^KzCjv5umWXO7v5sCW3$lcA*c<}izL7^k**
zUSy1YgU`@n?`ecZ+44Z{dlXL8@os8icgBP(J8pXJ1J(Z0X>fP&g}y>~)J+>&*Kv)h
zPW_PMfx6p>?w}Gtnvsc@<+B{bdJSZL&?Xng_7$ttN=o6U?_wj$og`!$Wui~p(8S$2
zH~{>Ry_RLa`v>%Q29-pVZBVhXbD1cAF?&WvX=loAI{I?Q^@+`Bc0h;7cIEq|+>0jz
zqEBhj#E2gp0G*o!Z)X|8WM`X%*P94Tqp-ay9C)-8ur~rOGT>td`&r}SnR4&jic+*z
zf6W$SULDfy-YvQKENZ<dq~$op>dxZ0X--<jpSb(lpqgfywHmZs@xZDBV%~8PSrR{0
zDHR{O8@=&j>z(=ufr*!5@9=oO>G&NPA(tvj<<naacUow&pV;73Y1Gcft>bp<5tt{;
zrtez0`<bJw%scYR7iLuqL;U&QO+5T}H}Cwk>$qR;CNSE)y_a<xCVPgi>>c40Q2OK7
z7O4FmHAJW#t8OhZwlgts59ovCB)wmm>EH(sx@{?uAJ8D)zoErHr{MqOixL`RGaw_m
zDj+<k8xj}K*)A5zeNa#fbx_vqvWeYb&7X#|udevhZ>P>Q2iNXwzrNe3KyeAp=x9c+
zN-O`{Z>+P>GX_u*Iu5g+{Nq@;XS2)hOBGKq9Xp5Jeg5F)m$DPW=kST{COd+QTatvw
zBhz<&)3aM;^NX=}%k|5Rem|&9s`xS&^X%<AuwQ&cH=lBU$BLw=<JYs>iSTo?t1qa3
zR$wl!AT^h*k$1Z!yPHkMN|Yg<P;k1y*kR+~#0Lfnn-23iUys@1%IqmbkV>3@Ec-Ez
ztMpkk)E!FbWFO_?hY>3eCx=k}!DEG#)PY^{aZD$58jm%MBC9O|f|Xs!gk4zI-!i^d
zA+R1nn}!xfOm&yOZgUAeONF>TH`~5@KH4JOf&M|P-Fi{pW1n*OyHp<7lkWVx7iJw)
zR1pD4@t#hqOJ&;?gi(LgK)3*d3#W*Cttt|aPG0G?@(bm;keQwy#2W9cG_X5(XMM}>
zV1AdDsZ5|eUvQ;6;uZHymNt*|E^#7u=vb3YGY0jjj3Q>FV(HTs&sb67iHIf#^K&r-
zXM23IdQx{vbln=poU286H-C%&Zsu{PzFbHCUe|b$WYdTZzM0tbYs{jQ)y?jQy%4KP
zTT6pVVO%a<vIu(Nn=9Q}Ua}HTEjQ<d<~^;ujN(dcVTv0&!xQ<PJjmnAXXbX5FH1FP
z?>b8%cgMPh(rPckXqsm%q8QaWJFR+dZPp9Mb_MX&m$pnac1Y1j6n5#nZ=Je;FPivW
zb7c-?HJGzT*1|wdG#To)B5a?KHD1V^on(>{uOFJIaAP~98-GQ`WpTO5ur6Rb1QR+>
zW6=~$ean8j%_4K4EoYv`VA~uPym{?0v#%e@O(|}^OiZc^W*56ao>KXzU0N-3ey2`A
zNkvU1N6xkslI-k>bGa}B#w}GL*NU-#r`sR(B@a=Jlw=y5mSrLnz4^#>C2#9-4QH#;
zyBQlTStPz)d#%UzsTDl-@kaUK)OyzV=3^6KT*m}&I&W?X7pzCa=jY`P-fMZzP@yp{
z)?U<2+}N107{#6#_ZTpSwMsN5D9&?Lt-eq!DLM0L{tX@S*bIvPG!=rUcu>xMqc`G@
z?5ktw`3Mh$Yi~|YyWSUjhj|joTXy&kX)=*X^`YXCUF^E+iMsB}$p^7VAGw>u4EsV_
zyvCB2U1#z?JrYU2bGbsjMV^mrqPnX<wcNOb8^^uF{Y2=|LEDw(H=<@;rtM$&n^57V
zPWD^r6V*LuOGbVJ!k}<Lrb>GO$@rT-PNQxzVyCXMuI?GJi#pxT1)@#slOaz}SJ%+k
zM#LU6kEaTp6^La1{qF=TIQ0h?IpS(rL_-ooWPN$M@8q6MH2#MALR)g98^QElNQ2Ys
zwLQf;3j<ehyy;6y*~o5y!%wAp3V$WMwy27eZ+NPzt2SPDl#?lBlM{m2v~>CeX^VDz
z*Q8fegGaw>2i70o{&=*jGHp=O&e%$SPtl&nhqcZ1-|Okz#HlC<vW(#!c6TN!bR+u1
zWqQ;|N3etR@QFD!uDjPMI&W?qaHTQ-!e#$1+i7#oj(03>v)Xw@cf;qg?h%`yUC*jT
z!%7i@txx@tlQOFcRS_2f`n~Aeg$_>7)z;Kx8)=Tev|O>(@Vv`;+uUkMAoU=nt)Xl(
zW1~IQuEa{~l$W1q*A@Iq$n8qLKE7%2dQy@Z*J4|S^_J-O2?o?OrKQHvg9j}FMOI__
zT?neZ*PdN-T(rY^TmQvkw_!QfFBYrQ@~C>Ql>j<uMoV~tTehglDL91cB4X^k-W88G
z@Y`m*NLyFW%NR;nk32b>GaSktltaoevr7zV8IAGVp~WvpyAvYH>~I1)-MgwfF&hgb
z3F~6(9*H4Sr0PIBl)uEi>p&FE$K_%}q8XyrLi@q{AWL+d2I8l$=a0Bs5ig%iko3PH
zj-ckf+&|Ij+VU#XqKH|?f(ZXus^^d~&u$Xud~3Ssi<IlmN-c%k6e*uPeH4k5h*1NK
z&^V$f#&gH++<B>O{Ffv;*!qRZC$yX1VxGpRLn>tAA*)h(Nwt%*OXs-7aHSD3wkFs_
z-ag~Dl2;~?Pw`XvtzQ0$lNPbNm%^iH2uuN@Y-;yMzx?USyg92zFn#us6$V2uO}l#7
zF1*?Hs^8hfllS>~U{|~5Xm!#sV3$;rb#tOvHf_P~K)p?D^U%_p#8(;aZ-gY4$KtN6
zJzM`29_?)z+F)K<s=S_pT=7nP-;BQIG%8n7OSNiWMQoq(K`V(U4{eHBe6|TN)z;-!
z*G0q?kc#7siV4q+mu@bM$YwA%^LHZJ_RU-O;eSLPMMn<E8ny*~Ho)14lOxoFjkBt<
z2kuOjWpj7SMV-&Eyr#n_pGIhLJwuixYl}<y)7$2$e8yPMgPWR83t?pUH`|G_Rli>r
zJhHIe%fNC1y*MrA?f(1K&amJ^8kPWQ3EtI$-&XaBUS7Jk9rkEAtlP^i;V3=3jQP2j
zrD}N#T|)D+NAoRj@t#st>)+h2!_`Sv%BHLKbVv=T(c;g&>?w1q>Xlvy>PaHmXiKSd
z-#F}culDKbY`)t;ACfV)E7-K^6K5zxcj;d61|CkxIqC&0-K-Qm=TgzvO2o^j6#AY`
z9qZ^K5rw;~+S+dvN8Ap2d~ermtS51Le7Ln%oV#>3hgaxq^1BI9;$P10L1iL_=3kzQ
zoF08VK(*|S@(OP>q>7{be5c^irJXo{v-R8&jjJKSiFcS5@3&y?t@wXbr!zzAy9cG0
zxE2U6Z`l;vH(-qeySIlEa>@@3*6Ht_9haWyZVjr73S8z%-|Vy+B&#@0SNQr!1F?RP
z>N;hoT3Y$}lhcKt&uND?dNi_nlOn^HD-X{yX`7cvI-L$(E?|wLq$ACo+9hH>4qkba
zFvyh|Y1v`Dds<IDuzPDx&_HT^$D3g^{lQ96z+atX1!A-`J8fxH;W<>!G~ws~?(Va`
z!y34w=e9G>(svA2JQ;-wdeEQoO`AG9h;6R7C<>l;nJ4H33lz(TQ0XP%GQ$2I*dvwP
zcMjG6HHRXZb}1BIuClS;_D5C8FESkDr9`Ysou_P26nlKzNLJ`*U-M+NP9phAx>Gwt
zQ1gw6hnh$yd*Vn#jvIq;Ne=G%mZ7HW>=)$Q+7ueUorT1_EZK{*(<SAX=LZM9gArz!
zhGXr!%q<lw87$q=?%J--^wxa>dL_O^cife>Wy815D++JB2~!qOm+07yG1m+DR3F%J
z|1rcYxZMOadkR50a)s$?FX~F}5j4kC!F@gT)#J`3%JDb4Qps0&$|uXZ859^8Sf)h!
zlPb2c)UPOZgKixTTRnEDpGzC56GwVTQG(zq_)6AO55}m+zjbOWmGE-I#yXmhxw1W0
z<PPkj3XCoPQ>yH5z+ccdt;|b~Sk2R?bEXN9qhoj}M=Bm-<b#|dRKP5QY_=>zXY>_C
zsRGja&7;d#B}Jxl_}GJ|mjW|+6ay0cKC;ktxlT(bhCDPX(qDk<43=CwTf^WV&^fng
zwip!Mnnx<eq^B++MHhy8blyQiwm@EL9cF16`|7Hr!g&u}EmjY{n0s(3|2RQ>)xx41
z@x>>7cYfJvo$HHKH)Cyg43~QQTdIXKdu$qQL#mXT*-r*+C^^X!OtnUF{5WnhDM1rW
z@q|3z5Gi_BlQuj{<;akrn^r{H2zmSsm;_9|yVX};GSFAf?<g^1XKecE>GwwyYU#Go
zqexW_OYRW`8VUt{^10N6Zs|(T+fsKJb~l-BlV2`(wHDX`@u)9-u-~Y4i;Z>F824ah
z`oi;@R9sw<`uuSWnOn8`=weG;M`L?bhH3i8_M%+0_2p9=b%zpDd5VWE^!g_QxguiV
z{Jw%Jdi?BuY5H_ILaj*Ea_sIG{RG#Ikp?(7UHs|X)z{B9ZJMcBS)~G{s<O*z6)=Ah
zRY_Zs{_d@PR0k80wyi<9K0c$(lsO%zR<?^^dp$RLu2esN+t1=L-QVs0=7Uw1ldEDh
z1BppXg6)p!avMRBv(XKxOQd@Ij2E&H?1v~3hgWgjr4`+dai**=9Yy_C<3)PXL;6!H
zG1Y55%pF3*ObE3^BK8Wa_jwx8*t6ZFEA?&1+#+;mPEjFFh^>5hdi3Md>cCwI!Xwa$
z7e_R66akkd8hC%5i$YI*A~6PF!lAo;R}}?XhmsRjY<=B`Mk0?>HEypI5#!y-(XBe@
zpdOos*ZOYuB966d+1maGvQ?{mn|U^CukswR>p<Nwaqs9k<%3$3DoxxTS^g}yUaO{;
z@7saGUG1c1rlCtrMA&jG(HYY&77vXJjedHtg1c}SPxImhT3X`MQGtz*?YD20fSjy9
z#<MG%AoV5j5H~lA6jH@mGB6i@`UOg`HnmxLYa%l{q6|U9p0hpC^fbzMQpx);J=uWO
z`e0)I%ojStQ43ePC_fFwBjOugiB`4>+S`TM0_ACMlC5{vj?%yXqHwQT!gG%D`DFjw
z?Q=tQ*zl)YY*l!YTG|WSC`?M6cF^UXdmZLJxzYYxsEhb$j@gt<Q}RSrl`EG%yKZq2
zZ?T+}pn)eCOAd?OFp%x>_vj(sT`jWMxD&kd#zy0EOM9-!bc&cyKx^wF=|qwX-`VF*
z?Phk~i59k}v$=O2=iMJP1XOs=9G(-CL*VRF9onyX&=61jh=LEYe?%Vn(fw*}GR<Zu
zwMR+KPE*ve##te5gc)uPD8^6IiHyHosIOUc%|HisKYwDWXNNE48U6eq15Mn<%4D1p
z_0MXTn_hE0)Xq2!mVZ~&K4G~zSS^d=)3&ic*aw)E*FiHXK%r;1w8}5La+`^cvioVP
z)Eisl8%LMi1sD$AS$XW0;2UracJ4SPu;p>IOi$U$)`M&2PsE?vWZxZZ)7ug3uNXSz
z^GR@ndq+9nYjX+$Sk4i#qjuhOsumGMCX%4s&2CeRqYT&Y7FN*H`cyWId(}sHt}#Bp
zb}BHDJaBXVz4yv-`eW)B5U86^L>NzMGd#O^63+1Kn$xY&@-G?bW8s)xo*2RN8)KXe
zEdr0XE}TZhJB@!zs&lDKR`(6RbCI!jIW_TgqP=mVwWMJ>ZkJk)>8;A8ByGmuFVjVM
z)fRe;D3T*+ny<gx5l<9CVIFY^OcgPOaD!2>NpeT~6rqU{(cW2j37!r%p1))rI>@1w
zQy7vdtD5tkd6u5SM&_EiZBj*ZH1=sR*K2M`R(xO!oQ?!dI#JT4pBU7$SUT-@p6AGc
zhp{d!S~h)T&h|;oW3<~hDa}SG_N^zwAK)<BRy<+SV!R>FG>Lw>=wJm?VC7TI4rumQ
zJV@O{j<t_f;AML@e5GX9=NP(ma?wl0NYWrN)oXPV&MlzcHCL*j+|$XLXi>iAYt%jZ
zSQhNq{r&zl@P%i2C)&Eyi}%D{USzi?xC>lJQw=e9tuT-#o?S7oyo7|GU^s)PA~7U~
zW%X|y`gGk5Wj)=WSt9<&t8A$Xrxc24#^<u|{3J%h>SX3Bd>opLWTM+2<C`M*rQmLl
z|B@KkhAlC1(Y#2URBx-BJ=SDsl0rdtrz$xlV1~AQ<5}_1?kJp*gNKp$P;YAN#puJ<
z1ir#a8a7+=C?k*DoujEL4E;`6_-%67L>Zm1(P4p&7u5!%lX*j1C8z@!oAMqbgXB0S
zHBA;1ilNh|O5__^cb3w;TqLd(;BrNR#|ECp6A63yX`Z3cM%6K;Q=57F+uDVL=czno
z;L&!bomjx_UXT-X?PqIadQHQx4Y(O{MZ(g@yPpH?9x>_>P~OK+NR`wspOS}zM6h+V
zwY9z6wo~{(VJM=SO>MY#R`}T)T6^M!#fx40bOGTDCs$dcqkP{cf9vD?bh;kcFas@g
zZl?7xy>%P)g;z!=`vs_Uxfxsq`JEEf<7fR>UJ}a&sslxs?Qn#r#O&bZmW>gaH)7eJ
z=64g=Ruah3Qy$p6C+<<C7ram{3ATQCDj295A(yn~WiHBGpBOW4-QsA9v{Uoph9Tu7
z<5l@vQUYYK)~E|ZiQ6SyqUwG;Rd^Ud^kSg!j!hZ4YgB}h4?VUk;xdd@&f+AOl6$%_
z)xqIsYUht*ZJOe%i_I9XsHX-HN8+1LoG4~H30I>vH)-|Tu6v-MYj$~cOhbRyMwiHV
zIaZO+K~oEjm~&e<l=2g$&(my?ucnep$4+X%0$Y6E;jY4VcwW2QKDgy&-J9~h{Zv3u
zE)9bjbuXN_ns9#Jc6QjBgMW>wGUGJjeb8>Fe2?0iWmkH`ZT-@Mf@^HEe5daw>L&yt
zTaA`3iA-xq(Ro~giK+Or1dM0XUmt$;z-{L_^aPB_*Lse4MsK<T`0K7ydi>@Z@TIji
z^n4>zpa@;FdKN~3`l=vpB@Hgn_6JA#yfgl0$L<rE9vJ2KMN**Fvt#z};+|#q0W+3_
zO=z|PHjU>wcrX&lTl~{ImtnV~`I6Z@u|`@aog36~{vA(!6uqg-gwojb_*G!(Ljvo%
z@j$+Drq5c^W~su@Tz%94&ndpLr8bt)$a4fvr1VY+b1+^wm8THfb(G+fa^YT3{#%Xp
zo!LOQh}6!e%3<)_#xbdb>`kuK>k^4nQd8OtQvNq?_^?Dhyd~8#9aFNXl+e1x+lsVN
zk-O-BUBf3u<3&JsYw;b#ECW6{(cV_oq9AK%WSreA<I*`X7T%mdRi~X#ZcmRMqRgPt
z9*9{F(7Cd{aqmGK?bBB2-Vr|q>MLSrW6N6N(7pi$<|MU~twE~8gB&?!7rM8$<A>Nr
z9zr#6glE@xg1OUyZ)sP>1GXw~E}f20aYeKQe$gW(%J&v3HA+^9J(Wn?vypI<5@y>f
z<+P#{Z=|_}B@8(!ZivL@(zsTe*yyn164Ip;$Y)#2H`19V6a`oNpJsUFvC?v34)7fQ
z!mOgF?kdtn#XRkI22*H8)AwS>Z#txA{q5l_rwj0cSjGJd7k$&(6V@crK`_Oasj_U>
z$*q~aoZRA}I_L(A9*oPLx^*Xg7U;VM5?=!GB?ApRj@8@rdu$?`P0E^S5xitxa4-`g
zaeJ-*LAMRMj;$qzIm|N*+V_Eoui=A?lh>5k)n~0N`><pcW}%!pSw{}Rld;LIq?PV|
z%DVShP;@TViJPQ*q~b%LyT@9XD($;2new#f*ypt_PksnN;~g(Ov+P4ASkF!`NnaKu
z%svRsCOh74_hl0OmyKX?qKnf7L<T@bLT)QWlFDPr{6}>;>EH>QVr8}Mjv}zAQwT6`
z4o~P~ng7b2;Wf5p1ASfAE#kq{F|-Z6d~EenlD?ED)6!|Ji{?`snyCTgu_|kR>+puD
z3Ary91+Jf!DCy*Jq0i>o+Mp5G4X*GAu`_k!0r>L3lh1+c>Wg<hxwgk-cqC8AJF>?x
zs4utQd$Ga!`svoY2UUwkJ{6xiMEg`x42#k3;;H#Y_)}#?9DTdf6>>);Shwk$yeZ7k
zTM6$0A8DJIbILzPZD{-Ro6mf>cTz?24DCfrQLYDge51H%4wDijZv8pXldu_oQtr>U
zmaR;$`H3$>0*|Gdf2rlACo7sfHfE!AMJF}Zh@_S<5YI#f(<PijkGQ&e%z|wOdJ}q;
z5%7BZ2)UzX(*iCTxtlB2JU&M~O61D7ZflxmU9VoP*=Yp5m~nR6@A#^xS4qqb2ZImq
z;AKy?RQ1$_4zz|cnh>#s$9@XCZ)LAp6lBj#TFzaZNf2|OU7Ojia!8EzXxw#x-7tG$
zZhC2U`ZNoB-Si2{zTQhOR`Zof(DS96&nE*pO4815XX>FnuO#r<?4ouFE<HZ2H=gW{
z1fBpy14K?P)KWVeO#1q@NS7bEnQGn&FJ0A1KQRA=ZU0!Okws#_IQz)qdnf;M191C#
zaGlLLF3pu4g?Y;E=^oL!A;^ErlX*tQQrfc5`5Xq?NHh~>6Ydhbk%FBAZ~CpLIfe_a
z8V)Dv0CLllc6$!$&Qyg#Iokwju%~Y-UM|8dA)GC{@OmNd(~;-Ah`QIR;~~bbC3sHz
zSzO@uMLoNmxwT-~KzSbJnR;-EQP~8}*3j1*&chNT;yCIAS#~}3_LlMo2~JDBrB8p0
z@I?!%xpTJ~>B0g}m>bLVG^wg9Z*oqNoS#j3+-`ytuQJ!C9(bdzUcBOVwHh|eWOn@)
zYin1;+o>Gik|)?yRE$;Im7$Uyf_HnZp8|J|AK!0+6`4mB*k5EENdWyQd*fUaI(??(
z9m@Riy5QN>jNveD?`;QHYGiHmki%BR-K4exn(UHy12KiIH0-v~3iT(ihi;Um8}7K}
zj267-Iclc@SAF6eKJNxzl3O&LkZ6>HUJ5o+A*NT&B)b-Csh(_?kgA@(E6c^u6sY^L
z<=A*@ufYgu^_>59YQ>I!{8NeGJ9oHA;qSuPr08xrO&9rzAG`*;=F&A?l=Armz;&G4
zs(SpQC8{lnw+qT&D!4v>@+7a>Rn`N>b;n<5?$uPnl{aFvlR588z_TUQ^(9=(x~<dd
z(gPDEc>3Gd9zq;e*;5{eSyo}og?M~oVo~Ca_7<-y^NS_ZSNf>wN>p}7Wyw@X&?Pu9
zU$cTiM@_w&2xGm(?>}MGiYi;1E|y-oK0=Nb^xb}GJtL^3CB{cKEor&%uo5T`wBr&p
zfn7s2x_qyN1vvIe#+j7Q@AjB|P8UH?b9yr%-WdEHbjyY8C*`TQwP=NnwZa$EV02m9
zVE<^WknQn};VB6Wq#(<}%Nc>6l{&Dm^LJ(7{>~q9_%li0*t<Y;ePy%QsyDOJ#xq$0
z`sdb?>tWZeBzMIcfNGp7QX7*a7TV4rEPGV;=vDf{%tTuXHIm38+$W$GmsBcGDXcWt
z&es7c?#L4PY*4xvZ4B!(%7A_W7vCqv_2E+r<SD5Xh*gq@+e0@a<oTw#sp71)in4c;
zDG+KeL`Gu#LZSi(m}bt$PVOkiH;9Ow?WZLD2qLo6+AxD->I!E%6qDm^8OkHW(j_nX
zo&HQHKQ2w<dt%%v^z@SIvtEmNY)IlLqxMG65+F=O1lSeZSE=5H1PCeD91MJ%`G&$(
zSm;#ra0RUda%H*xv2LjLd?`Qe6(>M!j6_$hPCo39X$|Kea8SRIQCQ5Q=%<jvv`g<a
z>f^B9Ek&?x_%l}OM(3%r^(&oBJFQHki?!V<y>}xJv-OX?nC`3HyRRouKKVkP5{a0t
zh<zz)BJQM8l%0SJMW-HO%El@9rj)!@50p1BxE%XYQeLk5B!3zcpKTur9V~M!!_U{}
z@GLqaEf@2&K6C^Hp1ULUEQ5HCi~Zz|ONYg6CCzs8%}sa+RcOt_skaXl9?(hmyP{pJ
zs;)3GSr1KIZBdL!KOq)Qs}wgK6yk7ri};Cmm&@Og>lme=t+Er0Ok_blzeN}AHRHe7
zN~i3Ty6ZB+RXp7nEj~h=4Dvpx@}NKJv_c{2BuZ`mo>OP~(P6)u>dtN)qeZCz2Q>{l
z8H3%*&@Jb3o|sdk?^G0zOKw<%3(L8l+?b#vG`vLZ(4<VM{I+rJFYa`wWBdnp*)k{K
zF4xx|UZs3s>oNr=#fZclz1XKHw(Hcny43Z~?shy)jnRtoOD{2BBdN{l2h)MiXiWxC
zbKU9zTi6RjCrB5qbIE=@33u@D^EB7~*QmwcIsT@6YqnrWCyA%<_ZOeFAupcP^@}?F
zOzn&OMH8^=lKt#TyXe`i_LM8jL&##;iF$2ZDP2Gx*YOnROUE~G{#@*nEN;t_M%b(_
zJQo(z=~^n*nfFcb&wkpGtx*4^qu@CE<aB&M7hUV-J?h+@we-(jvX0~K6Qk1+*&(;-
z3Nt5+Za-7IrM^O2X@vbQ_KP@9mCJn-`)!A_@f{!SZ8i?VR69hziv1geEnDrGT?W!;
zK8l~-I8Oc*g9{X3qTRasXysC`=(AINT5X_Az~W2FxAB|RsSZrH)DI41ZLWn^pAb1u
z`+=&rmAq1rS7ScN987tade=XTt6Pz=T#)`vkKe~FEd1n`L-x1MpPSYRA@z*$TFb~Z
z6`vUFlzM|f!4rob@l?#@6dWtpIr}nq?sZIXRpZO8$%25AF5`n;Qw4}JFM)Pp2_4lm
zZXO=fr3ItiajOo$)(E&WT}_Oy`F+2gqv=$dbmTGhr^ag8cO!|X<}wpU3iT70Z%b7q
zNn%{4CxV&9Ja}X}l=|d*@ALJMP1ZTj9l2Imv5{it9nfP=LCj_}v!)Vx)XMLd+~^>`
z*{Kt~xUKrGt92upIk_n+pUH)DW?y+*mpC8to!|;c3+Uh0n_3$5>1}wLWLdI(4YoO9
zSm{^LWu!hZc^B)&XETc5XNvKPo^j^+VT&=gNir{UcjFPXBJ?W8MWCq4IT|w~`1^I{
z9qlcPSMa5tv!#o#B&DXigf0;ifN8+RG3xVcp*!LCxlN0T2MCB{vt&5ICEsGcESff5
zd;Y_qUqFA^oDXI!S(B$R*w9u{jK80CW1!s3u{W>fyns_6j!!_DU$ACL<?vwWp@g}N
zHe24-FwW(%OfwG{T$Ze2-we4=)Hwg!^ZS6QMRlGLq4xek75{86bAphfY5frYul8?$
zF#$Ca*_XgNvhQyG^ygnWV4`&964=^js`>dKTF_&k?`y9Z(EcDPets(TLfCIr**VPK
zxSxJ`-$~!h1Sg6y@r!$T=jZ?V<4EPFz)RW-M;B;*br7RM$k1oj8e;ilEcj6spl4x!
zPzSD!@^D(0UmheY9E@t2Tn@bZ>Iw8ef1DIi2C(DZ!POS~Kiv24H{W!E6E!Q8P^|gY
zy8R9Z_k2Ukib(p?FYo)20xfW&S;)!y8^2n&L5|=5H#q*U430WSkh9^Ozs}jEsGIZP
zy%)^u9BHKCY7a@6ew8#Je_m07K+&xHEd5hq_$jR32|`w-0Os&tf5pHPME(8C)~9|I
z)4%<Z82}y!pP}!={Ohl1UI0#4%Fi(eewCnqeaK(}4{V>-cu4ZguiU&3wA4ojud@Eq
z>UutR8Zx#ChHJR(D<D7r`M<a2rx5sFS^oF7{O@h~*2(^}B-%ZpD>Ai|(7j0p-YxW-
Nw1k3q_U#95{||dUUX%a;

literal 0
HcmV?d00001

diff --git a/docs/images/github-2026.png b/docs/images/github-2026.png
new file mode 100644
index 0000000000000000000000000000000000000000..b908c8a4ed17044b8408579ca317c4d571a85f01
GIT binary patch
literal 60481
zcmeFYWn5fMwl@j^0)!AC1PdD68wu|2?rs5syF=p^Jh+qK?k<hH1b26L?FMc?GxMJF
zocqq4Pxs^9zg=Cm%WIXb^<S&Q73C#R-+g`u0|SF9B`K;51A_pBfq`{JdJBzNRP@7y
zfq5@)AtItEB_cwi=xAqVVQmTnBN?8kfvBl6gq@|MEQN#~=9lm%orILaF9BT}=1>eh
zF%}+)qCY6dSON!2w>8XAOhf3Co*t~0bx~;r{g2gpdTiAMmuf?ewIG<56S{Stb&mU&
z`)t<N45zad78oXOcor?j5(L4luLeZ;A3L*RGrB4H5Rh_Uu`l5D-~1BpkBW|l`SW(d
zw~=E$hof#Jnzr2c?p0$NI~+?GCiZ*SwAec%qFw=5KMoYrD{q)EmO&laiR9u7?J$>J
zCc&^$HBObNbTv-BD8L=Kci@Tyhy;^Li9W~*`{%@;w^c9&*#(zLXM-L~Di0kja+03R
zp$32H9cJ?jEhGNd)PA0CZu}$1*v%I?e-bC8Ql~=>#~jfwBUqylfssoP13-g|GZfXj
zj^5*Y8LhcyV<?wOk6OyxOCAf)Z=ZU(VRD*8XU;3T%jiwN2P_fSW6`=-nO*S1IcJb^
zL<@8d{DAl0M8_A(_%aq1iF-ja91CCSZTS4hQHo!H$k->WwC_hw6KwYORdIFTwf;!#
zbrT!})4xsNZQ=`#sr(y_@|eSK;g4`nDJn+l-XD8a!{AWJ!{gAcgb9iV!%>JYq!>oG
z#6CO?CRUf|(tk;c$o~Rs=~G58LPWr`0pd|$PT_IomFbQl=uEz<-4dCt?<RVO@O;^$
zTSZizkj_*@rY;+XJ1R#0;l1*HbbQ}b5GPyA@yHdN@vMo1mzM2~p8yfbII7a+9{K>?
zyREka*gHLa#d8A@rjL`CN1T^Gtc5h|xQV<4!eDsOkro7zb+}XB)%fR?xBkM{FZK%X
zhZz*2M28!IHM190_Ko>Ov@Q7M0h5$j@qHA^!8umon?YZq{u0h1^g@2_fJlG-MClLi
z@D4;sh|L$;i<RVrKS(fmgCci`F^~;0y9pePRBm6rfU(cR_FpiWJE;-Pzp=jM3m57Y
zG^S=w`5ubD)zQR31RL{G)x1Hl;=~kF`4S`%<l61ittO1Px%Wvb&Ra8KTL^Imji^ZB
zsqwa}{8s@!ksnylr6{u2USuPzwcDeqi8x~swWiI#NlncNZTdy$?fS|uSb-m`2>FpY
z4=UE7F*9}Z&iKkovro%UMJ95@B^-7|<`0lIyAnXa{>5h2!p9R5*S9?WnLTOMZ#(;=
zjiNN^Tt$OJ)mM66usAq%tbKX86wM#f9zD&~5>+|px!t&YmG5^W%y&wO#Me|8Wt+)a
z>9WUy4c;@S1F*QGj9WQdo8WSuUWyFtDvh5&bV#MQbd48iFy7I(x3|xbL=>L4oiRig
ziS`e4<|F>u*r+h$MA)>u2$ml-2$3$vy8INfVVPjDJF)k+->mp^Tp$XOychL%k9|+s
zb5Og%og8>*$gT<VLx@HbdCvb`6@oS5tRa9C=CdFxCoB+lze~&>YbBtx5R(^<Zv*uq
zj06e!7ny7?46|4nI$|%vCP{}R`bYm>(jm#uKf@(4C|K~d!V*YJ<KBJ4R}O@P5s1r^
z?8mz9P&%R=3hR>+E56VF)l$T485J$gMU8_hu{|mEost`sK@{iL$fRT4yVbzCT&h3U
z2WoY2J|TC;Fw>oyDR_Hf4opPY!TE-GDFo>eiH4?{Sn8o{U0`p#<Ia}qdrl1VE$bDG
ziVa0xSe&iti{=NGwl|gi$CoM(rVygFK;JKakj3E<191EmQUnLdWvM=44kPg(hawej
z*3L+|i;#cR62<?G=#3p8zSyhPYuYQ<>(jg4>$(MJ3<wuxA>oSkmQ*5#rO8&6T@qXp
z;TCTZJtA)>vx=1)V%#xwe5WPNNSYky79aBy5Jwy@pj=0-{s|!cNlY|VN=s-_$l|wd
zj<Yhqa(ywoDzPOmTY8J1wtRVRR>4|9$JC!cO!F5rVUw}nN9U>M7b+dpx3l`a(msr3
z_2=eKCDiTK>D6u5rPpaVbFZeIDJcBfpH7~(I-ojqJ3RlInkJv-Ef=@PJ0?BmIVO`f
zf%ho{D{v%bl=@o&^9L42rj~kY?Ky2;2LCzTa_RCO?fH7o`qU+py4<?!x@3#<IsU?D
z(a=1Ta?CukDXqL(z5Tp#ILiJy!>bhGJ>k6%dlqJej7sz3$(8BlIwh?djdG0=3KA1)
z042K+{rokI_7B+oHD;Gu&1G0+aAj6yXk?KR_7Y(d^n^+rTT@|;Ph_{xw|!3(PvD!%
zBVQ&%e0aPa+%lH$Oid<X_)GZxxbhq;*6vGHUU_Gd=W*R}6l7?TkX0nM8jc@qX{L3n
zMYBco3%#7Znr3ZX4|xua$RoY$<jdd6hm_(ORSJqLi+i2R51FS6t@+rKGe;QBvyJal
z@KS@*XvP{+>r;KcHZm(P0a(_}fdc`SUDbnCnpTs>lO`6HTx*UErsccm>YwPM)skjC
zOIg+J%5BQx%W!l!GzF?B8#k9fEzK;gG~_QoEy~xH*R&f;)NL>9F4)wxevesdT{K_R
zSTe8|BwQgR|Bz0wB!MCB5&bi|<g?3a+}@xIy?vQW+kUU(4|`fiOM6fLB}eDs1GU_V
z$d|2?y^Q0wp2s=dOlBjKAN^mWJPwV|Nu7(Gn^}_h+1*dts-sK{nz);O=y9~J*_*UP
zx#^tDZQU)d_UN7I@2~9|9mefdPi}KdBx8<g^>ZCdUA(`@*k3$(TpL-XTR--jH&}~a
z<63KN&yK9cqatcFS%D*VBKDtP&;DT0V3&5TzWzagRlwgMaoxuk#W(I%{&hf?$Clj<
z?cT%B$&YtKu~R1t$L_<qI|(-KN6n85*m;-<=&Bgb91FahtWE4qRJ{z})CVsWg}=KW
zl>9mNHtC2p=s8EeMoPzYrOm)5!qLY73Uu=e6HR_4A|z%9jy){LsmDzXhESvT#b{%?
zP%Tk<YTryS_of`A45vs`n;4r9WQCjb%Y`o!-c$0E0L38X@XPR~!ZM^}%xu+^mp00V
zQ%8Bx$hlObsrLMfOj<uzQiP?YWEWGXc$mL$wS;FD+ZOi~&r>eSrZFF`eCru%j*pQw
zlEskaN)eZokzUTclR~E``gl`tJ<U;YkL1yP+igzjJE^Udydcr04dLveGI8mTm(3n!
zOV!f?YME-Se$2`fz9QxM>LqixoKcja$K}&3)eOEG^sw*<&F7vXI4mxvR56#eN#+{-
zVM;jNR#2WkM~0Ssu1fMl>PNq~-b3zsNu3(7uuWq_M^Wp-)^qD7khRWS(!6fGF1y)z
zZ@YV=o7il#HmFwHEPYI$3A{#dmSN)**L>)tv!^wx^R?0mI0!jHm_gt|0n#}#YU|y2
z8clT<i1kP80X#4C2HooW()zBpjw9M}?6d*^ar72C+^&Zq`3BOW6rd#T<fKHPHl^;}
z@x4h0;I+ffqyMS_>x_=QlDs0JqOD=rPVLt6bT+t@xC{?e0A%p88Cse@E-2&C*wbz>
z<#TCw^pWro_1Jzpf=b8XT{2kGq>ZQ8Y?nLPpO3$8`_ZPQZqe6i6?>Z@Ux(j1(Yn2w
z;hT<6qKn$1>(*VsX^boR8Rs?JerQ@|2#<^#aE)ShR*6u@r=&l(z^rld46FWoc};_r
z!ckU)7u-Gj9M_!9^1zZt3-O7@neUUyQq25^AmZ;_gIt>T@v{o}Xv}DdGi0}{$6lXn
zK68JL$6rPZCA77;vgN+1ot|h-8%v{$IUv+>Nbq!?oa`_O9`KAAiFV5#<h{%>l^!XN
z$CTIS!g4A(b$&Rk1;M{MUcJ8`t*+%aPoMC}<blxb&xc%}?H}u`YNI{x-7WuOzi)U#
zA;S3#@YJ`qB%TM}{9Mn+OojuzItKghLS_d`Pv<{YtTttNwr__V^v9<+a~MGMFTevj
z*LIk;$t#mBDz5VfwzI^pz9+}_=bVm!3;pBgCU7GW5;3n=k^4ij(<IqbZp}bJj8#?>
zuf^HBvz7<vt?6;|8gt^-h}W4Hr){U@eSzoQR}HI)psaD6D;ys{ayyHA{c-*Aanjns
zTC3gFnzy&k)%b?qt=Bl1mG~z=?+fQM=Ap`?dFzCnK{sgSY~=Vj9(gC=#Q^qwQ3E?3
zOxp?q3?Cj0<qC%~Rmpwmb4byB-7^w|s%%Z<4j<xF9Qb;}yn1oI#|;B^gE2(C#Vdvp
zorVp&hd)@T7O}Ah%!AHV@i5L%8|0rdvXVc%L>1rXt@rXl-m8{W7(P52yh#hxQU~n$
zLIn(X6DbkJ_oy(iws70$(C;6nno?$Raxk>eFcJ(r>}MDRXb2YS_+jz?D=ZF64FmU&
z_%|>xp%yUk|H>l|_5XTeq3*9T|McO0hQJ^~zdk~pd(NBxlN$k;1NVQzu&&TF7$FrA
zDJiJ0V&Z6OYU}jf&YAk*&jd6A*<Mo12?hq6;x7j)rA&SSt$*G^Rnu8hPL|um&W6$G
zo1L*Kqq~j$U-iK7x^qK=Hm1%-B<?oWwocsce5C)#!3_=n6%8OI`9~IKD?U<9IYkl?
zJ4aIzc19*fCQ|-)BqSufj^E6<l|{w>RUG=oNBZ5_*`6B!aC38GbYo?-b2JAqb8&G2
zm{<TTEDX>b3{D=l&PMJGwoYXKtmOaHBWmho;%H&-Y++|h@>jh^#&#~we59m*HS}N4
zKl^FwZt>qO**g7eSkM6i{z?HbGcp1Gt8Qpf-oIkG6)oINt+hlgY@jrQw!zQJ@s;-<
z`Twt!|8DVbB{l!MB=c7$_P-bXThjl#sG5_hqlldiv`uIJ|DLaZ75;nTzY6jK{u=t<
zNbyfP|05PkX#RJ+fd85_{&!zdP`IJ<NMIqVpbGV&tLz_7EA*Ed>i+Vf&d;TlwRsf=
zMi53yR7lkw_9PQA<x?MaFhJ=OS(u++0Frc4Sq=&9?*NiLKN4wi!2rova;_gFl1Ukf
z)LgV&RLE~WQcw$hf=9^ID7;g%8<U+l8?CWU;p=O3cFV7LDdiqLTyFg7p^E<YBMIz(
ze*LSy#71`8E!<F`1;I=D{m1t!>^l$v61m`;|M;St!Bay*v_h}!|Ceec{kj1IFvzk0
z`3=H@wq!K-i<jU(cN+F%&cz7x|I!!1H%8)q-F7K1)M%mqaY)c^QbQcy|1W)s6->d%
zxxhCg9Pat@ztHe6(!l*kx<I@6|C8oFQs@6O()g28K=fOjrEI0+#gz*rG0av6dtm)-
zmfZ&bY?4t}CDC6Q1$sIT5H|7{noT^)M-vKEG#<|tC*}+Yst#-tD5jKWaQkS#MI|D|
z0qFmHx;>IS(?z3fA|v4amg3G!)Xd>TS^T7&2tV5qUnoD+$ZB@Tjs?(Gl}?~e%2^ud
z|F^5Cm(L%b2J&(}A;97|gZsGK3rLep#G#YA-1>!r_xgOFO|RJ`IcK*(ZZ%&K|BU$I
z=xLbuvgs3@x~RVTmRu73y|~Qt#U|O+bIELt$$<P~jY~S@a)9_s@|Uo3l^~Etw<(tQ
z(%k~YEuX<j6BzpbHX?>`D|kOUUO9&EvmSc^7~PNL{-zc%_)8?zMLJ@SSgPmAB~zEp
zaxUrIS2Mry{&bD8Sf$W)>f@BO^FUne(&uy=i}g)bJPxCu6*V&^6sFxxlhs;2WiyG}
zUA!$>TYVA3Gg8|o`Qr;E-;NtjudYh%j*imUEy$zr*}}?8w9x+D&K4x4h}{TU&-Udf
zmrHAi)e|^#jdeYr(^~U>Rx{^GNwj)>p(|gmi$7c+MM~lGd2(j4y^$P>-{17}z^2!w
zzr|<&kP;o_wgwd8uCt;mR?c_4dd>;jIy#?qYzWjloT<)Kt-N!sTEz6}NUhx)oGsO0
zYfUa`!`<HYA2isirrJ4KbZUu4!=H=alS}8krTDbzcG`052yyR4i83D%*fvd!>=$<<
z7>5mB93IH7a~PlPj`{S{u23PmmaNTw6HTkmJ$%hzu1ssET0*AfEWNvuE{U4V<QNj|
zNF_`D@6H8#irAc>b&F|GVp93i6WdqS&HHoEYm&HJ+RzroNJdK*Jviu-B6dsFnqGr<
ze&=Z*GI}Zr`(p@3uDHy+Ennt$q&~5C0;Cqx1&PFoOg8jkaj@z?wg-R=Lq92|A2rJL
z>CWfe*J<!iqz67^OGmk_BeQ$`o=65MGOywowpf7+j=8h2=s?M^aELNyw=_Vos}1=!
z-~B(vexGYbJW{sk<kE@_$e=^p8$GO>EE9Dhpj2pLxa=-;nm=>g9bSK9b^2TE-N51(
zB2IV3VU41^dyRZYio^BF#^VkeNQ-ee3k&<iIkj7_=)XOs1>PVFKLq#bExQu#w0fXq
zyfqt6P?FE&E^idU0#eDR{XRM_8WAqb{AyIT<H@9K2!6gtxl*q`s&PA4;8vLY9c=oP
z5bn7OaXYL8k^6T2Hd9$@cogL?((1u*jjM8AbSze*x{5z~bTS|AK@-?XKz7}o<ycD^
zOK&_nVFjg<2EW64-|+qS1dc|xqVY!{rcWVd4P4HJ*ETnO#rQeC8+=*nzquAZ0{r2>
zKssL3*%q4|Y73A?CiMAQkb1Sq)<S3@>K>15yD@Ib6?RJr$jW8kF+fD!-z4*i0Q<dm
zt99~cZPy>n@#FowcHz4vq688sqwu*c?uK(JL!`4io?TRr6|^NYmxvdJCM%Ycx^{;X
z6P0>GMRh1MSb7tgL^nAy#N|$iP=ePNb}i<yHTE0Z6)NKY-6biCE{WcK9-*c`$?s$2
zu?(`a^Us!Bw&eJ<i4$+a7fV+;4Fcbv{!E}z=3KrTR@u#VqlCMzpDUlwiKEy3w0ZB;
zR}<{`>T|y+mU+u&Io0I0R$kml*Kv{I&9&h~#n6IPcbl)F?<RVr#aeKPy#1SQKRwzL
zdPGsvfnJ5833(V(2mrnv-ai2b`ZTIlek(q1p6jIg%jOeViOs`Hp6eaiJ3B-1ONj_i
z8<$i0^(Yb0FR$H!{%qeDns`cu*~@09{hw4LNpU?A(ZdCD>89HSa*i*M^Q)Yi8b-|=
zKUMcTJb;YFj!xb8YR2VubK>@1U-WUgqB8#Gi3H}{wO-98_sicap2y`^cRF^1lO_Y-
zR$EYOY@grOXJ1d{=o9ii5>u{=5OmW4K;(zh5=4#Z7bpUw2cTy#nsnM%jv+X-omd<?
zwVRp`^NGc;FKYa`614NgNQQw@4=ZoHWfW34wO%?L#T<7A8F#Ziv^PAzjV^=@b()Q)
zooc4dd%p4w#ctZ_p;7|Ao{9hF{!puM!xfE%IrnQ~vxVGgZ?xr<Gepqm1II^!=Q;z8
z>plERn)Tsg)8hu4lJ$nc20|Y4o>jMFpx0*eJ0*GVux(L;*N1JQ#b&Ey$4PrJomLb2
z1f_Vw-<871pl4Tcv(b$Fhy>c(l+U2J{VKcHY!#nq95H+j+n?EJ#7W>9)A-OCU@0~6
zWaEmr)1TI0&~7G=8}c1$BO?-;K!#3<dU4tOW%e`a!2E2_p@DBADn9$6>tFZWyAmf<
zAI&^_qvprGukwVpbONUWB-eX@KNaSTx=lG?Mun`<JjZ-#ATWD%7~GG*+Km5n0zTI$
zzU(l#D`xg{qP1J&{i*TDIiT^j!RpiclgQz@;)LD0PpZv>xqusEx4B!?(d<q^x-E+o
zP=-}J_QJN_t?gl3SF7DD6H;ZFNT4*IWi|hjXuVh??ZDPW1+gxaO`WRb=jqm+?>yO<
z5I8<o=I=u_aO3^mlyBb*O1azM4LeFRJr6zpH@pP;GW^HL3-HbK?oLn0EnytCK!%C&
zC5pfCQk@;Vz}<Ad4Aq1hHF0dJ4PKkstm9AyO?*7gZ3?<1r+CY0a+7I<nKDS<MumQf
z!W-3Bu{CS_{zhf@TW?j@WYXmr3@r9<%Ajn)%~ByaT`s>#4UtfpbAJCm%cenG7WW)%
zvC}8t$K4=a{W}Z7+b63^YX57RV!ioQ+RraB;QQn4u#7v0WtXMn=|XvDNE`p%L;TVy
z;)?HvW=Y3YNT%A;?P+meOU0_!P*|M7aUH_?*w0X+;nSVk;PqRpj^sV!#-D1X^PGow
z(%a&wc^2{Ft_fLwjBZ&-I0U9y?z;Wnd@FRT))}wQZZyg#%<UHX@PF|L%0*$|Aftj6
zDq@a!PZzR&dDQ`b2>S0M4(lDH!GaH7izm6_Q&mEImsqDdjW&SzLfL689EKF=Mcm-D
z61lKjz1C{Z;c=T-(lPmFvwlc|;mwtZ0P4#Xip1buX(vUuYx-2PidXU7xQ;wy>noK4
z0Uefs_u_~|<Iwkh#NH-D;fXaL)4@L&N@je{hB5KBD4^^H3ktQ8j=j7^Is}xxWaQy>
z4pD)1Kc@<xfr)RBpw9UDD127wcIR+hk&azB8wn~%cL|=!nm6*M4q8WD=k5OFPYUmN
z;j_Qi8Hn&j;J18xNObmH+>uOJ;S3IjEo?jm|K$!VH;qK}NsaZTHx+(G%xpsCt>8cu
zGaT{xUH$r}em=vzmaLnD*?G}N28ZbT)72h@goXiY)p>f*J3OI(BimF<k_aJzsN^#e
zyw1l?Tr`=nfbF#5#y!~E#@yAo5EziovyX&xecv#(Yk52gj2iGz&E_yNY>~B4#vk(d
zn{F@h!^j$%<@`P7hCT1yjtlin%j|%1Vbc9Kr%Z0Q_(_v~k6DlGnjoGMddXA2Co?*$
zZ<@VnhA1HP(9`fU#eqeq{q`k8g|vF7`Iu<@D3Q<)>9qC1WsA5EVgmkZgaH^ze?DmL
zW%1z~A$-3QP6<(SPz@+%fC#U!By|<RZN*$t*&IQ(uKAT8`+k^Rw*(nz_Ne>ZqMAN}
zV@!-}@4T*G8C0!&6;;+euU*<fMbU7-?ed3Tx(jtc?WMib6A59Kh&m6!f)?=158d*K
zw28!_2-jv-R@y292FZYt>0#xy3*l@-(gr94OM85HOPQ|!^y6GVoFBgn3ACW`<m|?^
zJzYL_FtRIyUF7hwzK_8*#_B!2kMHv>M`d*ynS^WNXAEnMNoeMQY+rrnVMFlIY^nZs
z4fKp>(MN8AGN<fnhr69Z22!92MEAbt+tuzzCvvw6#P%z(dW^&i6sw&9X@NsE0;nF0
zNI70_Y5twTBp2l~;nCyiER&VV<Q9c;Bd`|*x6Q9J0;%!h_MrMoEBTDOSnfC}zzKPC
zsov`838~Z_bEV=-)m2E0Ti)U?nRz0Xt7B%@ga*-p_MQ&$El(B)$oI<1&jIab9%|#L
z|AylUvw0)!CmSo|!+1WFb#3&_VKH2%X=gGp(ZYS(Xthq0_msGCyjbNBFM(_?PuT8x
zk5c@B!jjX}YTgE2S?k*ilsn`lW&<x2=Z?ltxT{xc9V^))IO`#zy_`H6cal&M(obaZ
z?4Rt1s#&#7y?sxxqx7atUL&A}zvBvvmfJ($<C!7mqjJX8@bI`4>+{Vj1c8Xc@rd_(
z_Q$!ltCPjrc^W(QD=hkwYePJ0UhS4L4L-T_#v5vfq1;~fv95&Usq(^jyYn?4N^L+X
zNMl4w#7l_^SGU7ktB~#<Ba5j0$$htrUls<_DWix^QE{$Hz9S@x|7xTFBF=LNMkBb8
zkr2(<Ry?ERt!#gcR_Rz_o$z3{UN{h1MwidvJ$!V$K&K)+RjVL$PJ66WOLx^jJa0Ex
z&K32JKM?}aMp#lQ1fr#LT4-uj*;mJ_mp_4t2r7{cizzLfr>cppHEWzxRcu!t!u9*S
z!5{_D3(+pz%1|xvSzKZAV}8b!$$*0WRDhO{KuU+$EBrgk7_Dd`o;9b-DGI7qA9=Eg
zr1IsAuVvJr&2eCChx6jQ2?JlTNCAp*Pj0uvv%Kw;i43l7HU1LRlaV@<{dU5Z+k@S_
zcD?ctiAN5%pVhuzpr(R_O;0dS%JuSEc6+o{xZaws&Izw(<3Op8^_`}7g|Vs6SSQ>2
z`2sk^51wn@tt~zIX5}sV^BlJ<ol<b~=X+yr73B;2cZ59c{R9<_t`~&0{uNrTc>j~b
z6Xe9~JYPKJar1h4*jA|Q;dMK6o2Ue3UOw5JCw}?B{-&PcgKOq@H;0Y=o~&(<=y%ER
zJCdK0J)0lD2!-I&Ko||GryiBijJmKZ-*kOnudYShDmh2<ObA_g%lu^l=CTW0&BmX3
zf!q2QVs}t_(T^4qPF$hy3t>v~w+-l@C395fnxZcPxJg*jHs~PZsXP<p9t@|?6DeHF
zbg1|ZRolrAuSn^Sg{M4kzY$6@iLu>XZfUxntn4=O+<fWP?kN=;nUl{7B7xX0we?xx
zFCEaar}i6{rJ4BsF^8TZeGw>ay%(rO^9hJvJbvL)fg4BoBrkWz0-b@+-gEisc8;B=
zhQaHC0E+^7aK8o49iens_(g=%8p8&{k4+PlKez&BWn_c^LT@-C_Rnk<dkF&(@rHpu
zd>2^2NlGSI9vvnQ7X!6<GTr4rj7SHrO=~ag1Cge(!lCkd1Vre=K7l@jH3owl5cX$3
zlWrM|br@`S592Eu(1<*?u0q#)U-XmJZm3kxZCWUsd6u}V<g%9HncHIKfwlGae+adZ
z?9Lc3;MM!j?ETk==Iy);OU`%iiTL|#op&wKM5lT`_sgd2dF%&@XDtyo+&syxKWyJ|
z0|zSjE?vL-FJarEN^kJ2)z}oCvEJ;5#}{I{TP?PcQ$fz292&0!2?Rz#kFI8lxiCpF
zd!cRZLBRy{&%(%6M652oy-PUYqqW*bl>rTr5QLTXv~Odq-aGS86Jc^y5H@fqiAh<|
zDlHzXZ9qIul0W4_0LoEKxxX9{y-kFWfzZ3dE+mnLFyjbTYP(RwV1q{26wd?&#eMfL
z<LR;JK?ci?Dso@V)Akx~u<&MgOy!A?v<l7>)6uBb-1>mbMmpL{za2>~ryDB_8v?O_
z4lgYTngeOu0cy_FUnsi)^unv%XRBTru65S4{X@n&3lgSk??;@R2!<I#Rrp&Hi-Oh<
zhDldDIu^Hg|FM&JO73iy8&)@sKw-?L;y!%+QrT=?72$U`&kz(UeL3O7UT}psk5f|o
z1mk)7gbn^y)ghg?ka4JC<^Q#BU^)h^*6S<DN`y3PUrXj~w-#Hr2i)Q6-52k(;!G$#
zfGf3t9rpKN&j9|U`y;mNqQ|cpSK<$=u7NRD^JhL#hW+h2dXY`XW48r(bkQkoU?F@>
zoPG~CcdOpD$IM)ph|6>3(<Y1mM@e*k;OdIT3KB8sLM8%vH8N)5-by{$)kdfFbPZtp
z5+G*zv5bNHWpuIjcNr<+Yg<_Fj<vzfIhloBb6;f{p+9n9mQTgc?PHg-6FWkK2G@>*
zIh*YIl#7yY;aihf4pSU<i?o#;FAZz`y;hk0QLa<o8gF*%eIWe$EeVnMtW%9eYirde
zg~mjitqn<6?ThM<8+9Tt!hLlyN)PiZ^*-^LJ7vo+EN-^T2fH%ULwV}IucEB3pFDRI
zJ!-7+T8rkNt`kc*F$+)En$>JOxW-%_AL{8e0PjSRWw|XcyPK~J$1_}O^wFFN?wDmW
zzsmo>0qkkaiNX(CfghrVscylRQ(e23S3*Hh9pq4^+uE=BeISQHf?A3GfUiQ5k8nwc
zs+e>VJtN+E^FTP73k5DQsOY+okEae`y#6$Mt41`Ks3Fl~ehg`@^{$0q>F+h)rBj_c
zYyeoUziEhBuP;@9pggvb_136!r)jrUSm3mNkUU(gjfo!k7Iyn85SML7F?^((1-wHb
zBph}S-QAvdBfgM$FHrBR-$o8a?Ph%K+Esdn8f?d;3jvjlpg=BACShw?jzJe(N2f#7
zLYq<jyr?Ar^i;5I@;s2Kvy=1+9<6v3BGjtBLewLp^rhD=ij_Gfy^vUW$lc=}JAL~0
z?ib-jFr;wH6vAV-SR>cseEh3c)%Tw8aAs2_esu)k0c9NvVKn}Zc>m<}_no!#Ps(;p
zoVNV%G00l$Eb(XGJDIza#hru6?V9h4_gCOx0p}&~dB+!pM27PD?JLkYA1Kxbj5d6%
zMklrVV<M#Pn9lc=!D`-4-Dz+q!E2V6hVrY$qR<4!jYGVra*<%K9d|r-`iRy#!%qv=
zy<w4NN9k6DG<P+^A{+hGZtLxhUu09itPG^$c$*{f=GM;-es2Y@OQbiP#iq}$a6ex2
z?`R}pAV&!P!~jmvR%4U;rzRlQR^Mx2y64Nrk@oYwnH1Ez<s$uc9^>2iW7fQ9yw@xx
z_C02NAGsheJ7$T^T9f$Hs*A>-*@bvYAH~`b@1+K{&KjJVsNJ~V6fU081dDyLuBK2n
zw#L)-d`o+v!$)Aq39IzrD~AyUuF)V8C`FVmb|Zuk{-bQ18OpCxkii~DD#=yK1(ad^
z_Qb(@vq#TXtk?DC5i{uGcy?bJMkbjt)1qcwSu1FyYBSdvk^=ybpiHR!Ic~TB_xzyv
z$!3KOstHqM1bkbA1apsJ0~2}PSX^6prE;I@fE-iuP7qx5+g0;x=7a2kczUD(7{J_P
zU)CgH4B5#9#b5*36?T^?_vBpkuArDl6zo}xhKuET9R<F)469$%r1vLFpJzl}CXqpf
zzRzk2U;?dr%P6vhw@c*=5Pdt}bpG(8KKUHil!sqE;*v4?KDPzWQ*Yw~k{GWOqVL<^
zE&}Xi`6d}wpVWM+Nl<VYl8DvIUG;HWX1Bdg(eBcA)p54}#{#1CPj$i>zDZp_4D>CY
za=JQ_!Fc;6<ZbWJ1c-of7&R!b`H&KiyQ&cTRMu0MzEa`=b*2M)@xHax;T$lCxxgRS
z?Y><28FW#~zn<J!+P<%O&@Jt-5Gz!X6!^=v#?d1uSWYwWi?udLda6+2TpP8_CmXoO
zCE=aLVIHzGbX{e&c0f9kM0Y+@Yj^J|mC5bmESBM{<86DVL}qbg1V=UIhF~*(s|X~_
z<oDrr@h-jfG{y$Hoh}gMn>H|z#1QfcXSugI2cQF^Qi47#fZPi6WK)&zgO`1w5Ow^T
z5C6Q>^V7{A_2z{p{Y@Mf!S_MbWssxcl36SCT^xP)j)0rv>FE*fX+S&{##y&rx&lv_
zBbOnegMBIfeEHATb5~H-0-GoWq(TQIWI1b*!=Qf3;y-7ziQ`dG2r?0Qs7F}SFes*N
z_i~+<BW87NqsBq;^qC4`zWP4&(Ub6XasLM<-k5X+qSNqi1dO?dsvqk7C8m&|p~-|F
zk_8v|pD4{p{|4$J3Bq6}4BwXvt^|u66*Azr0uO&wPVig56nAnr8D)OH(hNt+#Z)=1
z-lh_j%PDweG-&?a!3dOmw>v@RK{ULpu^z@85ARXZ{!(-D`WS1yR3k$2b}jRTkw%vZ
zr0QN!ree08bXsG(jlI}m(r9ba@5Lf{2d*8KE4KT|%|_NisbA$DTv51!nZKc|s$RZI
zf(Ya%ok;M~%>o$6&-2+$vJ5#GuovGzSPO=XQ9yVzcG=KVAweWGhDL9fkw*UpgGRl{
zZw0t)BM&T-&E`^&&*EoDq~&Gcs#)JpbUnCGN^P|-ZlDF`52HA4%~(8|&GB-1?=&?O
zgnZX8G7K`kT&`?~B5A8wRW?Pq12yLBuuA-4rt@d*OT$=6LkP3$K3eCuOZSi0INu;M
zb}m_Iv--(>Bf!|qlF>>~R@`VRt0mp3gm9H*zq@ALxBL^Hi`oqC=k#ym&M`Z{3s{fM
zMaK%y&UN3{+~p>ZWk%BtXGtHU3=yB_6oq$tBe}qI2}^MiiKt{&^YNjq><<Tb$@Kb~
zfRQAi>hp^%4nrlK#tU|2_9vR3GSAwxgl~UE(iFyOH(v~7*Jx>>+pRUI0KunaE4~KU
z#mdD2dGd+U1>QUoXX-vTNk?=%Cu^++F;Z+p89>;d&o9=>1<q1K`O&Fe>4FO=pkaaH
z8AwirAVkp5DiEV5<Y3~yU8&c*R6kIBnASSHqEo}K$|@L(rc4SW%j-<*@n{5avJ*RJ
z;InPB>uFrd$m)A0>+!I;F?Ref$lf41>S)^a8>ja}SP^op^IE{smca3{g(n{~3aHjx
zKKae#_2ITXc;ZENMH5j3X*jbmXPhX}3T2mAO`7*EXdJQh3V<jYR%s?MzkSs8QpOjX
zj#Qg%#=wukmYTIzS56LH{cPaQk4bs<h&4t%lr|JL`hFw~E!DxiltHZ*rQYMi$$=pU
zJvO;3nQfYf2u=q|jI1j@jV-C-uWG_1n;MVjNuk$#TPL}rm@y+Vfc7Gysk7wPvo;mm
z_FMJl(*~Ve6j)Y$?_h(%DsANYzcyRn%X;~xKXAyf)r)B#PG7Rz;JO`$Dn6v<FBl%L
zTww@(9~-KUI}AG!3Hgwm)eb(iUNFzpK1ZqWO=UGzZnK>pO~^L)C=eFQ4DGJOSL%=Z
z8|n=&1GA+zV2d%4t+(8$+O09?C+7B26eLO!Z94W-E4&wt^Kq_hnLJP;(xu@vaViG;
z`r|>YdM(h&W<#|?mPYHP9VDc%7V0FGjveL9rqYqh;It?4oyfJlA>A)48x6beG%ny#
z^zqoGCJ}HSG~>R{rd4pqY<cpHVbtaO>Wmae_xZE}KckFBnd8>jyP&0x)#VYwMu{IF
z`*2vHMu+G7{GgAar&Yjhbv(`+t07N2v%^a*D}TX-@(Dqnh+11sL`!@YVe)4qxuC3_
zPmovX_WRPI?R-*H#pqW@Wo?&(im3NrntBKW?A*5#ad!LmN5JA>o7a-M;0ezgw-v7i
zJm@7`=xn*H`&`i46Rz&`EV(S-o<Q<aifOLC!Jg;T8k49=aJgKgUEWVQWc9d5m$>Us
za4#`(+{kL4Z&51Wa`J!ym%%NJr&92z`5I(}LxtY#(^IREILRn)-v;ODyGJhakj>@h
zUu#pjfqR03;;K!3>~(iKAK*)Es$T)|re55px6?!cRjJ$jsj8;euaSjg(5|bBeDoAe
zn9CYOx_@i4?DEHM^2aBjs3qNcol>xZcB2cw4{=%V%6?+eF+K@Fl9GB$;Y=U$7uD*y
zMt&VZh;VaR5yUtMW)sTTd#x*gcbjo&kMjt)NLM+UcGco-rA}K=U4EXXkwSMx147v{
zGY*}Ww(lHj*TBPm9Yc1mBSn=D_=Cq`B8PK*H3I~=&{XWr0odBQo6Ui}(hct9Kmn_`
zE!Xfi1RJEU?~Z89crdM2cZ+IQRlMugdmt1r`dN33?vQJ#SQ+iTLV6`MV1_$=E7*OW
zR)4&c=|)yzfZKSzH|o5$v<wb7zb52yJuE5;GH8`$dM4EAJ|ER`%Copedfjl3i{sH?
z92gV%CoCI=s65TTtTuF@)RSkO8kWpV$=8zqY;5!JN9byFTHz7P9~=r*Sx#Mk0zO|b
z1^i9@L<0Y2M7<(OX}jRyV{WMT8Ip6CI_y2#Di~N?i$kZYsFPG6=M`bCgq?6P`$I9`
z7{R05GSAjflsiud7q~Y>wS&f17@P)?)rvY3slx@erVzu=^&5P^FYn-e5hKCw`N83F
z_3bB(Nv|$I{6UOMbF!nT%(K>X>~|#Pl;!cV;8qC+Q0Z)($5w-pk=F9kp|YkXv!smg
z3zBf}>C&%!lM{>|7brqEql?!y-yYGlMT2}dV?K-X4y?z2X>Z6tonhB8Ec@;K8OI~f
zuL${}F09?*n*FPmHk;MKLo-`<rM%*+&<;b2KqY}{_lp}!vPFbR*lr;IIb~zXOE|4}
zz9?i?dNdU4Mgo;THWH6@Pyy_l1PF~z0x=pSnP)SS&8~Z@X~355=s$y|x_S2aJixcf
zUqw#bPV(&PI%6D+qQSjG(~hb>?a?jho-Vef$&GXld@dyklUG0FAH+;2qiA;ggB?d)
z_3C5H>%gcKOIxP>zsLr5mKU!Pz(Q5Q2AXOdPfeN8p@TXV)--(VIJ6@NeI+p%Avfn0
zkr`7*w<$04_4k4lkTbLvPSN!sT1dAwpU~Ugn5k4|pQ!|kFO5n*Stnie7iM#}!)gY%
zMaWSBCHqidG3z&lG?!^&X_((`6){ic#~0meV>6HGq_@QE4r7?od3^ZKbd{i8B^=iI
zErBxa+~rXAyTf^d{Y#tcf-xQ45z=+U`eUBce&&=MU0u#g2Az7gN#IDk*FD!GR1P^z
z&Z;z2qSAYmxRsIU&CMS<;?)$#QUn=AJ}(I&f0h62PV;3=-gPdyQuA=9RQ=h9iiplM
z%e!AnB`HDQ!c63m%;k#ua!8bCgi=n2^RRTj%w_8|QE=dwE*%t?oGUpNdTk13&}rm)
z{Bw>wL0M-xJub!LN`G;Zj++~@`*;mH-s0Tj^SV0%kx9g)(LN_7(t=JB#9j;oJi9g$
z@Hl|KHR24x>yi2UwCZ=X#H;-;aEKW`Cf4xpLI$ktIxwjt_P6q7<n=h+WEJCuxG$li
z;EiF!nxIg46H!L|@(jy@;r$~H+*_``w?1q$i<JP4_(Lc!Ax}iGT|8arqHKNBc!)WJ
ze*j@W4YRax>T~hAS-6x>@0#O~&Eg)DiaB};0>W59Qavk5uKRA-mh7?x?tp(GemhoB
zY%KHB4cka5I>-OuyXj$fm*=m?5u<of(-B^52(dEm^uR|~!!@(Hl#zGCCG;*XpN|@S
zMLIMpQ=>HkerW&`I4t4|C$6Mbu!~wo%bHQzx2h*|*GV$fUvt?jKyFDDy5-Y}rnMT2
z{lty)m$OzJm(+9`m37%4AZ62kTz4(Iq`*x!ID{bJv^v#zS=n-xSfS5UMSA#@%&v&m
zz&5UTpw4pVJ8<86hDSvE4?he|vU0usHTg8h`ppC-;XKS3EFL-JTYU>#{NdZs3ahav
zIsKu~7=mlrXV(ge@NRj?OJJz8K2tC7#Bl1*+%?F+{%1mBvr2z>ojOz?1hQC{k&ZVZ
zyUG^hV9Mjqpdhr;#-t7YF~R+6IXNz+0+4dXYjoOe4VGcU2XkfyFl!!8S@}6-?76Qd
z4JS&zw~T2e4Of3qi?2T<K6<FG;IF(Vo6EOC+n3-9Dq1gxJxgAs_-*hCEB^?!eDGN5
zH9&$V<aTkm68h$Z37^=C3~+F-jG;cP0e{c6=WQr@gVD|57snt?=Y}Jnq~8wqs0ZI1
z8f1R0HI5KR7q%X+rhqIN(~4R)qL*FZKoQ8yhKmRjhi!x}GiFb-u}1o1)nYoPU5AMw
zs5&b>{3}80uBSX)E3^BrKo=6yKMomuZsRl&Pl)d$KRw8b9gww7%#zztN&%qqQ?R}H
zwS$+D-*xYJATzFPn8GHGFqL~6C;|u2!oHX{Ao?H{tY+ZRvna9pMC@t*e1Uq0QhC2t
zd74gO&l7uL<)ntG^pps)-wfD4wPee1-NcQ$z{h_k9DO{UFM`4N4myMj+t(aG;cJ9p
zUM3196OX<d2}u?h{;^Q(bZ`+TPt?ZC1m<>r2*b2f???xAN=fj)1BJX#{=24=`3sZL
z@OuWP`m+Tx%09v_RO2iiKN6&_qrpkZZDO*sr*{$5m6UPQkBIN_cGdKly3bRP&qBOx
zw`gfOx+`nk@0OAm52mhBR<V)dD0_o1P`-Q|?Ht#TmEZyLJNHU)oYwTMqA-SpiVx~u
z2DW0P6eG$+BAkG<jwg80?Q-8;<1oy7d=YO&nDK8(I7X&=6n_Wmil%AP6l}ei>SUmf
zu*-z%_yo=t3%3<*`!f)-WRh1<kyei)q;#FP?1XWA97e<EW&@vxp8lzkwBn&$xa(C9
z3ldoMV)<r2wW=<i?5Uc?KzwMpa%U3(xi=kwVqs4;ybwj(UE&Aq#ag$@Q4LJpO-w7y
zx2O<ZeRuwD;)?Jd$CaS)sSXiy!ri+^P$ox$i)_WM)UiS)X)rMjx&1&ag$(v$lSM7P
zc3ZClL!5wtek$uRK2_z%#yp5qVutg>P|&d-X)p>ME7+;VxKCQE*0ntzq_?bo1swZ4
z?rPoa*_o&EFiH$tfu*k!d0m2h&cub=fH5j6mpVg*XQfg8$HDe>F}{Z3!8VCE?`b&b
zGn>`Oy?{FyCEz&b>Il<TwjWWT-f3^#iLx^Q@VyD4no6-2jByLhaZjMv(w!OMUu<?t
zrv9~ZA`e)FB6UT~Q~5e*RK!=j6_hbvb)pVKS<gU1;#r4CLIEXi=SW<c!ARF61|4zV
zmtVaCsUX8RR~7%SH-|NS*SmMib^`?;?mVvl!b8-2Jh!n=6m}bJwW-`**4<)P*|))U
zn$@IG6F9e`3HiGS&tDsn#ZX(H;i63ppv~%?(Li5eDWVHzaz^tt*Vs@TS!>$+%9@?Q
zEInGa$eYP{s0A3e!sV8j=~3RLJkU!lJpU)iuooUhK|oFZ5tI0Yyhp&c52uv-8EziM
z{)-~iKJD28WqcmWfN?(-$`b+lB0Lo4HprjK;2m#sg4}5|Ij8nNc|-VhUMyUqnlxO`
zo|M4;{LTke8a553p~t7^hU0dXnG)5o0;hKEm>#IYa}}99!^?JJP3o5nmaWZ#pDAzY
z)sC2Nhg4j-Ja1B37!^J`o#2jK?E8d1)xH0vu>Las7<pY}nK*p4U=lOT<zk}?GRnO(
zFK2yu6=?CSvarwmI~S(<#vYEzVoCNC|L(Z*DMS^*!6v0Ktxo8YsuT!rl84yplC`~_
z;V+@Wv*2r>t#UV9rRTlRUff1|aoUua5BfWTXS(~;`JsQdhsREJ)|TYtYZ;<rp`k9H
zx8k$hsc?5=#>YO>m#tmT?&iIy<AZNbyj>3uY`0yzeRX(Fw>uuE{1(Q)Z>P#_F1&b^
zAIZndbhU2IJ{Py91lWJM1O{Sz)@EM`c`Jmp_BDA{`4Fc=G+h;e8Joag>QRk5LsUey
z@sPR3VyUMmZ;VH;&mGakzyqOO;a^Rk0Lp_SgoA>+)3_Z`7#l2I9Gz_NZ&vI&GvB<S
zygL3<Uzvq#Gg|e+J^liq)t_wkL~@mNIb{=6VA?+p>8*o{Z!b<p*RLQ-plI+e=>Ni*
z26IoC())o?GV&NB9vgo|(3bdPofqP9CuaGD71%I?%_I$5VblSSxZI2<#q`;;J|Ajl
zp|9n;<SS@7UtH<EKyd%#e%0?g(@m+rvUd2p4p<;lw)>TZ#EBM@T?20dPqJMDt_|I$
z{?i?}8-x0d+8ck1huAJ4X?6{7lBMO(##-|U1lp4AFP3%Sy8662%G4hWoAY<^797S;
zGvUg0l17AB%iRF@r;w;OV9nr8$Z7`O(UxQKD!G65Iwdh%vWN5q+9!T%&56|B5xIxH
zAVq~l-!+UBIlj9Q6dmhptSX1N<F(wzNQh@7%~4B`Cc-AS!5UKa)VCHWZnb5a>4{3{
zTUDUHP66NF(eA|=Z~9mOwjC(Eh-g?4&R%U0LA>KkpQnTTCe>A8x=i6i&Z>p8qTm*o
zQCDyOEcqa|l~TRk4q*f*1;<87?Tj`x1h4;d)vw>dFZD0@ww+9mM<DDh*I1Ni<uNMa
zEpyoC@HPPzvRS&U0%T2Z>1Sty9HH9R_o}kmjZd1{5rcx893+&Ke>X*i7cx8zVPN^b
z@IBK>5mcd%nJT8C>+=N2c0DVvjlzEkKF%N#x35FcA%ol<%xEioGC!BlQvOl%EmCE(
zQK>ymxkfYS?Z#Zv3K~Djsg6%x{Fd-TCaZ6??4w!qjyFlGv*mU<)-Q}dCTrz{Ur5|u
z>VjDaS|%`nD*4hBwr_xiXW0=oYpBu>ef-fx0$)&)%VOD%IjjWQ!$ka$R;q1SPr<m$
z;(~oor<N?1>ldLcNC70eFU2g;+51q9=3AbEjt9$xPK_&8%Qv0(Gw^;LM!O|0EZ#Sw
z04Um*z{9WAY}rn)*DMXrXc*yBYpB~mkg!HHxa6n~>)43>9&F$>m2;{y$0Oh2pvVmU
zub3s|*H?=b^uG2tl%6WK#NW!($cHrG{jlsOe~az(yuID=M|5;gWW{e#JBvuvkA-~}
z@$xc13b$-F-o0mWUXb(`%OL#AFie3@OFfMPEU86PSRJ3?vin(3Jn~7KQZ{3YO1z8o
zE->x9Sza9xw)R^wOAC>~WKXef`N{HqJg-LekLZ$osHDEkZ5%+!gSI5#F!jm&BY&O`
zk55f!03NI`4gIy_PM9Ytw+@qD%l9meY{9ax@sQK?Mwx_H)x(wg)@(oI>ISjv0w`Jq
zuCfB<=z2&(Ek;c*r%d(Vd<vRVXV4i`86K|x9zNBQk$w>Y&y>pPQ4&eW(Nzpm8`)EC
zlxJusoOMWf6Ol}hb!*XLy+&}UKG7@E>v<eCpQm1)_VY3ei3&`KDzlr`yI9F^vFK4n
zG`NLhf!>)2FiGWhX<3)SX#3{gd?a)A;x*eoE|m~LyU=Ynai+I(JFo9hgSh;<m*&Sl
zn$0spLp=KK$z|@OnZ;=8TP5=*<$o!%>X(Y>fpY%DZs&1b!`v%K<&;D+nk^ibn(Hz_
zb<=R==TK#6n<hm7p1$FxSP~(VzCGb`>pc~ZHq#`*mGP)t7K>crV{`;`w;Vw4h__<3
zMkqHAKey@FQq7!UlV(IhqA#Af;Y{r-+H_7Ce4<*xXE(svPVLY8BftA(+AE?SJhxPC
z5k%E*O%Z~=!>?NzR+-G%6-NI3e-e^E;h7w?p9^ems^@(`X}n6bSEYOgB*Suke}R|0
z89ar&%1qfGyIvBZI>p(=$lYSQRPHGLNz8zH+m~NEBbb+_*20)TI4z$$;;+I95pRkw
zoV7ge%U@sj9_vaoI9;^YG}OBlXy_DpaF6w5k><B+=j4@DvC9f%D>At9M2?Y?T4(JF
zZGAdsNRPvWFuGe*Qni(UwqnhSf0WFG`AshIb-F9tK`Mp5YR3EAS~--=Dz?XM^l?TE
zA4(l$i_}5tF0GoKw@|$REe;lo(b0Pb!(|`S&o-1zwN!4b7G~kdTdt>zR8ISV$=}>t
z=^Q1c41RK13)-JAIheycIPc);AmX#k4=ZzFR%)~wKVP093f)D+17A`1F8?xZ%>KsZ
z#J^#V@p;<Qq?ADPNTpEzkV9edY=qLnF5ELo(hKBn@*4sfKF4AFuJQ^M+<3D2mLF|*
zxXW@cn?-+o8k&6{*|;{S$K?{ZI22EHtE1G!=ZE{r+VA0cIhA!O|BY@qxkjy1$j46I
z$K1*1V1?0mC@UxJkU4+Te1%iWK+IY)p=f>o>5B%gG3?DE)DF~n`AbqE)W*2?^GAJG
zB%uAe!?av6h1}<R9LnlROI-!|OkN7~i1U_f`Jn`^_+&L7>yw_w4=2Y5ak)newm+?p
z`ml&3g^}l{*Q*_XzDpgsK&fDMG-7Va)?uWE=V3rg2mec{uGfZl@B;oQS189L?zV5S
z6I<@n=gxZ>Kg0V8@4vI_<mgziY*Hx%%5$yum@xBi><KsUp|&s#49hOFljUh_2@ntB
zspGL_=cMVQ`@{4~^*HGXF<h#Y8j0v<QX8Jzne-mSJIBcG3W<ku%}pAQ<ND-L#+xfo
zJ-*I-;fZmZHlT)q(p&B*ox1toE`dvId8$LdJq@6k5shWQS1972<2}RF?Kk|@>|pTn
zs%HrmX#5)kSWDCBw#rk_vUocs_t5URYgc@`Il$d+1x|vR1Z%Yq<K7eC&7A+3@N)iR
z0hPA4I0mKiC&)EE`&S+Zj7h`4>V|J3nIuNMJwV5Av`z-RjhUJ2_zOhbef#E-L|Md3
zGW&&bfOG)~BuUJdmz^Drj#YV}%Li|D=>=6YSj^|6rIA#EAiq_CzuKTG<GqwBsK`*I
z-%%938@+6IJ>8bpaFq8ot@en(T|5&7gONdzpS>r`2TU;`(rjEijIXcp`xEeVB2DC(
z{3!%;_rpJhcjL@X|3Jii?_lW`eQ%p;=b-?6#)N?<p(^43VW@>9C@9xPX(Mo)ukwX*
z4!of^^lbQHKob_b=ov9;hO~%*{kLBlyo}j|PT9zkdi(zPE2B-qf!F001)H4`_Tk(n
zW+vimpXkGBA*9?^38?X9%2mmj8fszkmlEr?Q^G2$(O{O8T+|>emB)9bwD01jotq{w
zmFMPcqZFr`{Jqu^oo~B+t)C&d@3#IyuLgpM$M<E6Zot2tXGG6UY$n*zwi~b|p!V#b
zc{@_xSb!A<f+}5tzcbHuYBq}XFMI?VZOm4A1Q{4z_(i<Mq?F61SZ9EmkY0?D__Wqf
zPx_X;sKxJCkcnyfbEw<0Mk>wCoeD^=`-`}Aurqv?S_>r;m1(2yM1c!JJMN&0!3O-E
zAM;hZgtAOH;Lkh`E%e%V?Q0CtG#cY4jynec$CG5t7GI-PYZQ?EGt7v2Q(fm}dgU_n
z+~ynj?SjM5`uqbjgwbE*kEYN$F(1vK7}FMQ`=!<D8SDx7|FHL-QB7@K+pr)?6H!1=
zy3%_S=^$8;E+9>ifHbM0_XKGoN|W9}no94XN4j*SLx9kG=p~Q<@8+Dlc<OyW?>ojf
zz8}vYMo3_1t-0o&YtCz3*W8f;9d67x=V{3Os_U;~wqoE#-(q<XreEXyX+>za7)~6A
zIA>g|B<X)zAYW!xqY|>OZS1$Z@d%Q}N==6g>ALY=Yz>Xqcs!6_e`u)t_CTB57d3iA
zK%Q_XOTj7X{*?!>pA2hOOI4vNzwud{+`%TQ?Yd;I!f6jJqIywx@?RF|pabJcWUu4k
zG6pD+dk5Cdv8gH|!lW*Nc5hF7X-E%T;0mMaW~4kOg3HG&2tBkXXJmaDDY7mS0pOkc
zQLdBoq-JLCUJDlE-GitzBAfenGLOSV8T6a@4utO?!6(zP$UD<$BZrV<fSp$~=gsyO
z0Xwr;nJ9y+Hv3##;yZB}v-FzrJ8D%93vw>b8`?7IAwpb(-4>M5zSEQ|&S_Y}fql7t
zm0tSs^wRj%;_fy)zb%L@F&v&O%92*TnN!vzE?rA@BET?&vmkM+9ZwtdIS!8_Uo3as
zGiufouzP4)y8-E9^dsU$)>i18z`0=H{wR5TKK2RBj(nRELCfvE-itPWhy3(}HAU$s
zYvYhT>BeK63QO7xJsm_!UwvzEX?H2cvm*BhG8^V?&msyy4P*J-j-k`UI5#O%!SK__
zv^4@CM_ldK-q7OhS?AZ+8&K8Kt_Y7|zeBQCx5O-~o5X*luUCk@^1$FxQX9M5MFPm>
zD>1eb(CAfgJ!hXZo#jU>A{qx_wGI4i+pad&=ZWR(>8;(1p{w8Q_HRkGn2|G1NuSw>
zabVDytetvItFBvHC7mx87*q|mGs2&IkUKJ4{=5yP?EO~m+-j8|V9}u2R%K5xcrW@0
z)h*V#uWz<ci@ffA`yr(^#^bOjt{xiqb(23|^|o}a%EoZ@5>+YqOg6YTT<8G6vH|SZ
ztgv+Bk~O)J%atEg8D-$n1}E5o3ueGKjZU4`_RCIFnc_p9&4tGo%?>vt(jn_jtprU;
zMbBat`(!dlwn2=BkI@wvh9eWfoTpcD=G?-qNCQwddYduHVjCmFQ|=!D3hy`KZMO)r
z_qSD(Ue9qGW<~5^ux}2!Y-X#Kv!tOtEt>nQ!;xyzcD>MFHADmta2uNVSe@4f@@m)o
z?QYUblLr4>pAwS41`S7jg2upyBt`XNhWNNe{Sz{AzZrdbcjOde?Kj$nP9uA5e3U3?
zM%12t-v)JYcITGa5i#+g(IQWiBr6p!_DlGXtJHNZukWtvn(JBWPH6#TjEXthxS6(M
zbc#pui;sL>;(qlK%sM1Xyf_qeDwfTi(@5H2pGj;VKCQkx@l|ocHl#IL#~Bl-^q#IW
z1|OF@R3LSoAF}8s=(Hinkuh=auI2`fxBo4!FPhm0j*~M<d|$w9itj-Nc)W%+S!(Nu
zK{nzmziyK=@)yY2Pra8TCNk)C9i=0fvO1`m!!L)w{b|m>$WfbuF5oTHgv$IF?y!HP
zj_S!B@4;skn8;$y_a73ILmf`JRvcetAQL%wLYBSdW%8le^*4_Gb5h6XOQT>km0>36
zu-g5)_H_jxYo1bqpxIYR<+q6!0+FAO_+x(m?f(Xdr!QZ7tu_lb?}-8kr>h;y(~EPb
zHhNj{J7f9{6XYUB;R<<*L~w;XxJUVK5`o{!R25zWU&Q>qL-NmsQ@;$|H|r4~UhQ86
z)ARg>diZl;7jd7A5h(Wvodroh{Pma_Edl*%Qu%R`ywabL+y604pxxF}v<hxY_k%wb
zv;AtoC(i+~ENj8(;*ZFm4rqTfq6>t~IJgwhsQYZY*A)I*NgPQD=w<)cO#fe+iLsFg
z?sMj(by|gvGpKXcEBw6ga|V#q_pgM<{*CiAl0ErwCooGPMbS>ht84<g#^V_ET<yv2
zMnd=*&~YvK7*%J0-i@4a!4x<q;l{D5SSftDFZes3_|32P<rwW%Zsi(Q?}TH&T+!(}
zb5P%?;wdogwU1*~OO?ERSB)%s3p26+Ul{E`-p%srM}9D3WO<wVlIh>~;U7GUjM?`r
zT41fng71~daDKu@Y&k3|_|TR0<_uNF=Eu2Dct+`ALcbZt?>zYa%R3kNF1M?td|1~L
zY^y~lF$RFD+(hls0j3%`-zgyE15eHM|Hh+jaIg8ybl%fB@R}RSlm&QCK4K7U4R$2e
zHR!Fs8TS)L0rJ;d#3m!$w+4PVMx_6<7eG70xTSUrb10*;F#RKHXX~QgoEA<vjD9-o
zZ^qE{?t=H}#>r9Dd>voeM6|e89j$&HkV>S~GL96Ua3yRiQ1M-;(){bth(iX57}$KI
z*f=zEBCf1#yhY{u=kiSjA|JG?uK2@+Q9ZK4@d<xBosZ;I?klBVmxbjkmACr`-Kn65
zw30b=be{l9q2UGlPk$2@nE?e?;R&W_UB+8(XTF;fp@pvn0>)np73T(2o}{@Y-4Fjd
zg5Adr4!rMel|}(2?_xKW_!~2k-2j45Ia=k}#n@1mpIBbM*(Cr|q+SRF5y5|ilP&)4
zlb?Tm@(hTH8vlE-Uv2WgHv7q+{?|2rzES?@8or{8_KV$m)t;za)4C;kg;Yro+Vu~$
zKmQY>?;4x^Lgx*!Gt6eBxE7~En)J!O&Nu2OjIltzlD$Qv^ne3x#j29Zd1g@0S?wgn
z9xnA<aNG}mdYse^s(P~I)zDPt*e7)>gC}ZKDBrM5n^iUO&J8YUK0ZmE+a(ODe%3PW
zMp(BF;DpL_br0<PV9H~SL;=VLu_Ety-d^_|UGL)LgR@Gwu19`}YFFBR`N(82)t<M-
z>%r{iq_Fi!M<q&PP!!1lB-Xc&c9)|3F70#;sKrI;1Kj#;1|wWaKYx6m*o3mBZ#Wf_
zkk#@mr8w16q)!^OjT8IiBi`t2%Scv-W=;q449m2T%FP5Ec~Wj&(1xD*(@Hx&dv}B9
z&e6^yVSG5@w*1$<>`6aBN!>BIvI(?>Fpu><+EIK*!Le>y*e>Wh>RtG5A&2F7b)pTn
zDZ8L!QupdZQ^OBg+d1mPDU8cJAe=M>_^+}tgiFfUo)mk}xF)_pq$oqE7=4KQ_pWG;
zOl+~^m#mP*nVDU_%bl-%{aqy5!{~3TNg9gxB530zuz)@-%Q@lGeDtw{U$GCe@YStW
zGfa~)h}M4_`F^Q4B`SmEPVWMPo88Ch>t`>><|tdtLDVyDoh=R;84pWt!Z>J&ccvn$
zy!IJb-nn4&^QPq^^uO&JsouKhTujM4*?)^l+&8cDTl#}fyf_J&ZGvi&ycdrTV<a}J
zr1t30(W7-{dEB4|4f<!0BaIj;h(@!Qkk7}Ljw}5v9J>5)Zy{U9uS>%K5Awq;Aq%BX
zVW=$63Rp9Z;vFgRfjHm9a3q*V|87h!pB7<s;P!|D<Gr-J!ZHqH9m$&Q(2I6^#t_Q`
z^|_mL5`iGF4Ymi>!z2wm5A314+ZG^u`Kt_f)MB`3ib>pG@foZOobU%LE6AcJfm7wW
zQ*+^<e=xq-l5GnOWN^Y7*DT!Yg||K)coMQE@05(iQ9v&qa&40MjxoQ9R(tNlsrl)V
z_rlX6J01?bjH+`XJJ9q%dPQbhNzCgYIZGu;`(6Qv#j-z3;Yv_+I%0X-ecoSuzv9~a
zH%+CmWX~yX4fORf*e07^!>pHHg=eVr8(Oi_F1Ip^Z#^O)hC>H(Rz=L!l!d@0u5anS
zCoYo;3o@AMTtGJ5U!{I=<iV${wRbGCj}jZa4^v>w*2CO2wiZKO$HLab9fb^T61FHr
zZBU&-%xuv`W=frxyVabONjE6961GnaL)}=)JcDN_6+dHknF5JwSRT>H&y3J~m<iQg
zm7cPh_2iNc1gVpnZBx5$NKh1E)N&>Ibc#Q-dG!YEgL<C3WVUQg)*Y!DMjxF9X{j%g
z2DMb8#NFwfqH=heW{SxM1?;c1`M4!Zc@5uMiaR~#I;Cl$Y>B^bb6~cRTeRv>0zGNF
z31c%jcO-W&Z9R-<H^c(a+(7X&9^PO(sXZdb_TRcLj>A$aaTpIM7OS+kdSF5+l9OHs
zt^nI=esr7M8A2j$L#9|#{LQ)z=Fxzxw5?rp5VoDt5TXWDQ`X{4b7`+vlvs9-g%_Iw
ziRlM|me)LXsg4(nTlUG{_AKSDfmPgxt_`8XLYZEa?07*!y>?NnCF(CSiki3D_Wf$q
zu&x$B7SdtA>`>s0z`WNPLfAba(}y9k)8BP?K@{H^M)fxbBV5)*L<1(cp@$5j>`w3`
zHm`&A7@4y=_N^|>s&7ot28V6JsdX`=0?vXOY1*~EL}B@nlwDu^`7%{h3Z!L;$Xk4Y
z=h}?stKNL@d@E<s@}dp0)X)w-c_!2Xv`~pisf9*&@@WsI1pzWhLri-e3yNoFFv=`j
zIiY=@S>Zr{<?>ZmFK~;ecSvL4`&a^R2}(}guS0S#frc)EnxP$6Zf(Sp(hSyK4@ya2
zy<*yPfg$HTC0|T`Hhs)_x0E6CWQJAzy0EqHg`q-6Iz`eagE}}q3Yl;A7uqLlAJsEP
zqB?!dhq?9Uf&LG7!KxICfr8p1FU$BWx7VhGKTgm<0j>NM8Ue+Po@9m9;V%n1Gk~70
z3*dBRFM17~Ob~rNT+G$V+ZPMqvooU8%k&g>F+_d1L`-E3#{wGuO&vC-4Au*24FDhK
zfyFq?t2RqDWxVJ@;Tg?6yGWoxjp7hzOntwAdiQgeGu@*TPBDkstZ2`5^?e-;h&Jec
zB#YAGeCzz%i};Xi?jW#w+DnnB?5@}@w_VC_+aTzN*+=hJi-O)!@X&4vd4I~_*X7VJ
ztfQ53H8}6ta)seQ>#NB|e??FTR=kOHu8=MXFfPoU?xcEm$!xM_|M>J|;Phgoh#Eb|
zv(K-edCqt!WV3F{ih8cchtLW?M*7?XPjR9trY7LjgGF<Pw2Kw~{9{{?!Wuq(?F1Qc
zWg5*V;AG4p1ySx%Hd`-SX*0<x=Ct?}DyU=yN^nEci77;Sr25@}B`Jl5u1Y56wLx-1
zZe>I3$BpGgH?B7CEli9dYmSZE>OTVF_|lgPq&4bx8#RD#IU%ztKsRZy+J9~0vGC;$
z_@*>Rx_6pMDtYau%Bel*vS*=S`^m+PfmLX+4x~PU(}feoMh^-)KIVq`uubJQus1@y
zo7+N<*T^PhwrHoldW0|pBWBKX65kyd#5|vA7a8WIg-77q`6<SDc5jMxR-)-dT%)_6
z71~DM%!jXXWJ3|rS_@yLzu+|^X!%?i9^Bc8+s=iw6)mE+TRyGQA=~NGFd|@RH_aR%
z5OK2&^ZYst?v8*TdsXb!6t!+<aSS-umGBqG6^GS$q7pS>C8zgaoYNUO4m;PtVji<z
zt-7K~umFa^!XiX)W$mTrYq6Yf@_H^f1YM;&;7q(J>Mo4FY;#ll4agv*u~jK{wSoJ2
zM)XpmFmKOHLgn82<jBLoeZdIf=GT1q)~bL)dspIA<`ms52DW`;^v)q%@Bl5c7Mgf>
zH}C!R5_!gZm`F<a#tB(xJ<f3dO^neBC8rh?P)mRK!8H~wv=pj0i?sr1hP>q89Q*U`
z*rBhZQ81z2iWNY>jqT5TC+fOhwRS>xvfKJv*6@)7Twd}x-zjdRS6T)1GPvQ&VfuuH
zXnSD@Zib|Rx5G;``ngFS!*OD^0xa%aV7&w!r`6c8Xo$OvdK8CQjAdQxcDhl>w3s?k
z2w{Ui5a|<dpoIGX=(GQl0|+`g+*cYDF6xr7^hI7NZl4{wq*|xv+bZ0-e>ST`-fBjG
zrwppm!zNlm&rbXXbQ-kb9}UW$0>tS!DbcivV|o+I_TCrfFa`5l%hg14^=5gMh528>
z<9p!xn+dxlBanfjdlp#w20*c|lVFeJr_G>7He8A2)xRE5?RaZGW>ObB>v=GRsd&*9
zN-I2`rz{G-Ic3h>)(W=U%9@&y$(_~2WaZ(XojxHGSi~*1+@*vFv{ZTythuc($}7Q7
zFG^Od-TUrgJ2TS20R@D@Q2x<+uW$>Xt5@$MSD=rRYW*VaYa054V6~mC;xIu%mT7W=
za`4WeWsO3ooE{jT>{HJp3bU;XAv6t%_0N4g&7c!;UW;O+ctYf47x4#%X(~d(1<;2`
z9|_VIojRXJKF)j`k$n3Fc4%lhQ)8S4Kj$J{hc;dtA(8B!kzEJ6CrKErh)=hLW{s{Z
z5dl6x(OKU}Q1y`j9u)ogW#N1D$5QWB#XjGQ_)?lVs%{TylR*^FNeo-Ou9Mnjd4fs|
z=|et(*|JqYxWBq~^Y~JRz{Yj-k5?PF+*SF3rU|SCfIgm{0K3}7$m5sbz8hlP8HjM~
zo$$EIFyWO+?5-+!@^Yu?<c$E?SD{hhG}}2XG>u<D27DXt&>Cnl3Ut*G4cXqIN1*+a
z!U4b7zc{A}sh-<vuV}ftSUp4u-M#~}J0W$sCE3+<2|v{=j{C);N9}VGy6^^mx!M!S
zg*6S_JF&NxKKtKx#?9f&Bya2XFd-KEXju0B@bTxMZ|{-pRfp4NY`si-EVH%`Qoo0@
zZ^sbq8JInMWS_wAP->pt5VB9^zfIPP=hSdp=1SUD?adP+CUU3L>1qj%K%;h;F|Og8
z8&H$!#EU0itB`V#gOiC3rsy@y5f%OZjST#nc0ge+?h<%RHd@YB!b1XHmEJ}=Q9$S5
zq>%>1-Iwk|q?f(`Y-R{fxlh#vf&j*-P4qU%AP^*Z^9sXJ1*HN6iKbD~Lr}L-N|Mhu
zryuVPSKoR~($uOHmn@2X4KO!JCJ#eJSB0)@U$d2yTQVB=V2XRAWDqV}m;Uv^1$x@`
z*9;<WgZLw!$)yL411qmzZi5OW9l2!Uao2g2py;k$3q4R704slbLbh7}i}-o2Tlm}Q
zkGI3@B6oWsZ<~sI&hTiQX6F^;pWs<zXO0Jpf5<<d-&zRsyd8FFH7+<RXZbEcGwWy*
z-|9Z(-ZA#QZ!c6O!QLQ@UPzT;$>|0czKi>!9+6C^3ct(!w~{`mZsY}Vm4QXqnLgZS
zfRnCKksJNU)>pI0pP@JQGX~C!DvM{i?lsvr5`<L7BzvUp)UzfOF-2S7C{yBnz-*NI
z0fK3QQA;`jBPrFQVdEIIj-5QL8X3jWZe6@}wXZ{g1JAS2Pxmddq4G9G)z{Z8dr7u?
zroAG`4;l_{M!ku9r@(Pj^(Oq{<*PfG<_hH1#q8+K5y2|>>;gkC4#q8o2RqL9NI50v
z%H4>pYgaa_PJ2}9n|++s(fbxn@ifX`8!mkH!=+LNz1MasZR)3L?3oqGHBZDR^}cH2
z_hrBh#46Pg*XD<xQ9&0nl!2hpa~fzPm4v;9g*1p{1@tzeL|;nqHncHLp)+K*7_DnL
z`A=S*U3-TzQGK<4$@6nP{ft{j{{l3~a_SpKy7<V<^kE1gP=08j_cz}>-6R2cKRrut
zt7NJ!nK-O-l~yg785rSS6J#7sbO^)v9yLP<Gh*lxeI^t?sU=Ddg$=J&zQ^4i3gE%k
zK%`#Am9&b&JIOs-fIePUc8x^Toqa{U;a(+#i(^VXDMlG}vDdt}HQFdgIIsX8_F6_r
zg?Iot`9!MQmKjd3|NW@hP#PKaPc+2VgJ!9p7`qV=qkQ=pqOjZMc-=yd&P_!n)D=Gd
z0iHcgBlyc+ULm6eZ!QV+mKkv$q8x)EQs14lp0%6db%HH=9ZM5-3-rScRg?7uKrwO@
zs)~&vV5iOf7k4JFE-v`n4q5l#Zpo}G;2CWysulq#fwNN~f}`OOROxQOK+O!vOdOD%
z9&iUD(F<wJhjyR~TPtDJ=^I+oW6Jz#4--WaeFH#s^(_xB(tqE6K$PZ}aO|M&LJmdY
zdzHZhitkdAENZ$)+RyY=em??2WqqQR-LjP+Rgrs{v9wz`_{n3m%4b?-1bDtb<oZOw
ztmBp0cx4$HH`2-^e6+7J=k4zgQ2PXMyI5?SRaei5k%loOGhFB%rk~)YbI<iL>&3+D
z>*u#pQ8lX_vVqC5eVE#ScP3SFX2j1iCGV5kS+0y(dqu|<z6s_M<wKs98PYzH1|L=u
z%FhIqTQpDDW$D<1`nH>eZwe6h#WmvX?kDhs-BhjIH*j`QM~6~C8;MS1dTt6g$oDwq
zon#=qPi=g%Ey~(HtuN9R&-GONFo3NW&2L2pp0CS3yZFpV9sm0GFYn7TpBCvYE_kOm
zxN)k!<nm3;dyNAMpAMuj446I?j8Bqo_LybG)>I$Lp4Fu2%!G{>H^r$|@gAM_08KMw
zjeHy~_4;l!PQRM?06@_mleil_-@;|k%~ubN+}roTcB^!!Oz)eDWXRhljBpPwU8p?<
z`lLX%g-EY%rI^?~e7x*T4jt-Vp!aUG;7!d5xqh`cMK=KCv|AD0YCHKhFz5XQeYy&D
z>{h`W&vi9fkK22qq)(~{Z?_EHY-xCNmEjAf#hWsK;b@r&qy(NPS-Q3i)T9BRxAYA-
zr0vs6Gb3@z>$dIYpu{ziK;+xg;ErEb;CeOgQL=xlWG@pDyu@v4RQTk04IGBlMR@i~
z@+DwIHx>@kf<>0z^I$KRG7Itz53O&wk~djRN@8A<7OJUVvKLIY)xl-$efv&*$he;!
z>q!is7PM($hoJ6*j7lY8OWGkGS>eZ?A+jqKcSmIRg6Whe%{3-Af!1UDqe~GfX={zw
z`ArxmE?&aamAtS_C|w*k1r-(B&GrcAeMt1Ca<B(|y{5qU-RTAte>|iljEa$e3r8MX
zO$fIG?Z)qNM%=$Ombmp?2n(bki*G|+3U9$0=Emy0<?0fc`v~CfsV>BT;so?a<mj{h
zQ46KTzg8mfpDWQobpc~b&6{Xmse!?nP(cgZU9tZW_~?!8<V)#L749a!eC2MH3$_O*
zLYD4AcKEv&P&DA3X;~t(4}Exs1Sf&WDr*1bi*;Y*({8$vE|!TR$68c;0@uj+>;Q`A
zN!YEK5nE*%S9XiqPJR%{Q*>zB53(eP!pul5sfi<)zX_bq;PiODH4DTV?-h&~VRFZ@
zHZ0XZ3%AJWr%JjgsuB2msia@n#v8e(dn3V!Tb+uRNHwb>5M;myxmcLAShIEz7yv$P
zsUd+EFN#8zBDSPhO>ACc55n!|rdm>&8e#dH_X0saGgKzM%KeudItd_^twjmZ)h>vG
zh9~=#N6d6lnqxRiF=7^sIX7{}+~mY+uZ(1}89_fiVhNdfuj~{y2C{kM*&{exze!8-
z114DKbiRFTTG<Eb2TfWzI+`$EqBe)p5W&^MLyg*CUvQ$F5*_F#l^$xg5y06k&a?$q
z4#2ly9VnFsdp+u@$LP>J<iwx^R{k0=EY^_fMm%r63!^C>x<b$~`;xm<1X;C&@I_Qk
zQsC?ABbLiEhd_s@UIZe$OMBY>#P6t^WZmXNH&(Zu)B_|V=YEr)6anZfTvz7<zk|@1
zlB;g|=a6sBT{4+KzmbDCEj$ptESWXCaK+rI;-Yi`?nV9i`{LN0+fyp#f>G1AC!z5f
zTh>wa4r>lS0N{oR!<TdT=AzZCW-=3c_r{qG*ByPdu=HJZ^QA%tCYq1KAxZdIz&<BO
zzW2tXvQbLx>DN!aMg~R3CTvP+&=VH}MuvqgF@pEZyK_G%p)*ROBKdl?y|-u%ga<`H
zqBb<3A|vW2^U_`$$tISem}oj>pJ@-Wj10O{?5-MV0O#BI&&_yDSk@Q?uWknu%T&~)
zx6*?a!IfoF>{wHg2c@G|?4wC@LFSv@=*zp3W^MNl{H@s@bQ8um5HVw^mDKk#i?mEW
zk8lrw-NXE4K*-k^(qm);=x9-)8}U(6XH0q=vN>?Diwm55%Rh9UL%_<fBOs71CWejr
zs>PY=E<Ano3jkpXc8y(hyK4BEEzrmvQKM>rUCaUU_8NBVv5;{$3G1{g4u4aQ2O~ft
zzS|DmE@d6FI0*ERtl_Su$ZF}D!e^=ry9#%zrh78<zmnc%vKtejXTr|vZX20CG?u(@
z6Z!Q?S%EGYCq8VhLET|n_;Szo&9xgsQ_W)}z8-`Z*Eob4w)J)a#aN~f)_7vPv9iJM
zyLAg8x=}FgnQv0Cyq=TY_t_EFTbO??8BfmP<q6WBic50A)qK<PnLKaCWU?Ik_+y{5
zzxU#u_;C|<VUad-i)KvbWB%B%{xUg|3KGB7G7)D33UN0!KPHo*40WL@^l8($y3qX|
zqz_0YF@cB~Ci!G*7Q8NdQhP3=(V3|d<L1Xp^mx#C+U`19d1=X@@kV9(H+KmR7sbdS
z7OC}H&6AXYGc^6{LL5iy_##5k$pBDRU!v5A@x{lLTf~ih1}5tkdVAzMw{i{uwj05s
zN2hm(5ymp?TjSXS7Ng^SN~l9<<46pevnwkT1ReMJns*HBM(F;5J*f?eMJEq~wRNgU
zce^X?*H)ckjD?M+8S(KO+=ZjmGt}6z;;#&Jy3rNwFzdE6`9walr@gKx{v}ooM#XGo
zK&;q{J3*MPolWXxq-{w^aR4<rB{ZsZgFFpFpVkBxq^)W(8QmW+?nsmHlB{I3+z|f<
z*g6JK(I;G%QmAp?G!67MFs{yihFL%)w1_CVr!VAc7JWPy2)F%;96xW*BhEXQ&l{>G
z-7BEr(|$Ne^Yk3zod5RW#mIS|#3ul0*qPqUm|c+|7Qkj>p%Bm2s(>xfTzKO9!~m7t
z`rRDojltVSQPHGAw*;L7qPcXmACoX-><U|N2Y+Uuj$CU@E<O7yOQ%!*%6JUm2lw2(
zK3NN81vhLb0t76=82^E<qPoFF0<W&3in`)hK)!d(HFMNb*dM*8aII{%e5B{}O=5F+
zFesWs^RWk`yz9C6$LXymTWA!3BZ(naakLE~C${ROrm6`*o663%(4<QXYCsd)Ins3m
z3x`J5_qA5V*x{v<9Ts9{uLDd<O>qYFu423Di}^{nsmMO@ibJ4f<14(`48FWNY~uQ8
ziBgU-EgOsC!?5??pHtIU7cEVF|KcQ~PEI4vs3@haQOQ+UbvO$RUKs3{8-kR5j#_F8
zl)=M1OWP86&^<~wCpm9Dy7D8hXfRJ-N&2X&T1Q;OkBQ%C+DKhy&)IxWcB+oFE5&W%
zW14=q3(3hIpoezEpkNX)s)>?X<KEQUHm@DeWl>%S8$%<KrmG{cPtOW8^p<3Regy0v
zG>ewLUEij4POE`VMIKO|7`(=7>BE}88<D=o5N5m`nXU0@D#$SC0O+ETDAtQZF7Aqc
zW>tp?8*`2oGVh5s?~(a|Fgn|6t~T3UEKsdEQGWNtOpm+o+2`e~rM@_wHzah-fa2eA
zw#lVcQimsAM4!GhrE8zRN0=lyMZ7X<b!f_U=cLLj{4<qGZzZzK2G+Z?xK<>-V!p7m
zz!eF*KMxQ@#e@KwK#+=HoB*TIv0!e-%D|_nk08j(@j7*<Ffr!oY)Kt<HK})#64?MA
z&-!rJZjdo|k$JrQX<DA=;gP{*(px#<RDCVgP79Ge`ju9$Rl^KYt`lpiMo_kc)gM}h
zUcx(Axl4=552|CjsMwyr`FL+4WV5;q9^>t?`%vGYeuCWo8DEjJ;a1JzlvfIdV1oqt
z8R<YO6|MiN2z!d}v3Vly=WWrKG6L~OuAm|Qr?Ow`q20?LB6rT<CeEhurxxy-hrwr8
z!*ozW(l@~C64F|mXrLqL1l&V^1)~t|QASM6gq$|telNM@6{OZ0Dtuvzv$3ENO&H~z
zjAGkE+!Asz=+d_J&I^axV#?@*e#oY`t&diBiS_O-`HYN(3=!tL8<Ut$<@(}FtCa9?
zD%TT!@VC@A;F+_&GTt8K@D}P9^UhYlbcry|B}B~2X13}FzB|_jWiQYJPaqAP=!5|T
zjCJM&BC%k0@G&{1VMC*VjyQC9NF*2`z-XU&4trfsajZYQtjjj5go~+bt}x$EtT>)}
zy=&DqY+J~5;Z%Lb^+~XK>Rh|e507rV_;R$%BT8rHD(bF>PPWZtCwNM&_tQSBC5TUU
z-Jvnt%AfZl2{gOjZ?EzYnP9<IM(WMs0!Sj$5j0nC84sB`T_D~K;!~TDZmkHX(XK0A
z6f`St*}cK-H;K!wZ%k;jgL(e2CWbIb)QO=|#^XS$5a|<MzTWCo1Abk>E{#)Jq>m=U
zDg2m0R4`sXP#4wtX+XW?ZRp*BIP)t>EKqQxB0VIiA%qjpt4Gk~D;e4Flq<4XLxzF@
zkyF@Gd1axRsIQ@zqC#vY6*sMGan}P;RDD$73qfB-n?FYSIcX4?d*fSg6W=S&Z5t7<
z+DzQVQ9?g|)5Rij6X3knZnYLTs03q2-MobL3T;oU;z-(Env;M+?9dK4CMZXT`pn4K
zJU>4NJz?d^^u#1kOr<7-?Lwm7!y=1m6{8ke6@acs9c^Z`*9cs$4CfBq2VgZ`2G}c3
zlGUMLf6BH^UZaI8*6g}BrhI(vb;Jr=my>ARd5d+N&C04>>t!}hq2!6ci}Zyg+!w#|
z*8Fq3ve?JokI%knSmsTdc0^Xkira6c(~54DiTBxQ#<GVWF9?j}^<fSof$r(calLQ9
z6R<nH@X5Yt-I@$EP3}(cFC)-8#akF$0WG9@34Y@dL9W9zO}2@x>r~cs)|~grWL5K)
z{4ksFz9Yq^A|tZ5PfrUfDq=hxcwv*Sd8R#yEX+y<y4ESD`#L~7ee?69*76qn6y==L
zNpGjbSG$7#A~=#=r;f7$6H&MQC!7aVrh+FFpW$WHnjg`JtaxGHD0p@8G;|o((ycn(
z*g&D{<0KzBLQ?T+U_m^^?vnib{STs(@H^tS=}&BKC~IyZ<d5FOaqDf|IMCv6$>=3t
z1#f(|RuccRZMm&9BeD`AM886E2k3S<l|ETKuFIO9-;kx9a$KX08Hm%JBFSR{4)lG~
z3E1H-JN;bX<+_v@rD(+)pznA1r7vkg7tEH6KZx6&ByLtL-+Y$cO|gUrXpTj}cy3RA
zVyZ->pC49-Bk_b8$Kt;OuSr66yq8i1ZELR3OAc;t59V8%SPt^bT?pH(bT|VTG73qr
z9WOGjmW{u@R^zh546Z-&{OZgKJdctHzKz7U!TC2Mkohjaw&TFEmJ4(o1l+&hbC<_z
z(d`K6=?ipwOSq;eXzhLNrhrwsGiq3qf2ONTEAL6qVQ#y;P?g#_3&@^@AAE|NAZ8sV
zG;_013+R~sG%7>eA*H3gg6we{4Nldar%?KZjlC7KZ_{ss=VuE9CItTd-4XZw0QzBE
z6WH(OTN}Ke-v2$dY8@aT0=7PQOm6*iSEb(^^aE_<YrisSu3h{P`n!*Q{`IZYFEehN
zdi7G}Z^%T1e!sAH2wyUmUjLgvE0G5tMgnwPr%{m|bUx}tIszi9YR~=W*Q%MyvJ_)9
zej&XjFXnuEk|sQiy7<sGk}zRwVw>TjsT}Jm9@a!u^;=8YYo9Cagb8T!t?(Jq+vGmD
zrvkKWrn72aWmuEjJNSH3qA&VjxqS>y2F|`_zO9xTvfY_Rkv@sl7sT&wtvUH&BU!CS
zN%x!+j`ir55qKBR4Ks_iaFXO{6`~@EfA50-kerY3e39G6zWNh*oF2-ss3hKvyz^)$
z;=pTvRqJReEzfZz1y=nIo{s=sV<Q)ARA_T*Kht=?`pY2R%mpZ83DNEL$q~UaIA=G*
z$OX6ArWu+Yew{&+OY;5rNk>=U3@z$;Bpay;S5;0(=avpL<hIUsoC}6{_L@0-O2AMf
zOZ9d~B-<{-EA<wv8%m}T)Z;f~&<Yx+)4djsyGEjt0j%-io2&e_JILNsUf?MOQ9zU#
z`ypEda5sE*HsK@84~`{HI*aWD1^oTyS|Z*WL@F>7mpx{E^Kd>=`Ho(^u%H0*oj6mn
zj;8z%!MCqhGe<q4G!Iq268w!N;bAGiwdu<z4|zM7BLnq_<ypDZ3S!~&rCHBF$8F45
z0FR1XL?&g~<n%*Z^<Xklh1Q-O9bKPTJUYKWbiFvTn<g(f=^S3pGt~c3OlcU^*WydA
z#`UXFze_l*hGeODb-AE6`?KNmQ_60bp~jky7J3R=wtJy(T?Bu#rhjQpvQy<nT75=K
zJB2x)^xG{4M{Dou;!$F7vV26Ef`6b2i&<iP@cQMg3a$}T`@p`QoHEnNQ)ODw?Q%Kb
zCfYn3t)*H1+$j-0ccv^DagF?XF4=V+K2(i<;EU^DUeCt98~4xFg+06UVf=Z_(9k4j
z-srK$k9S%V6%{Y?vN^3FkID<=8r_OJgNd}l3kdW%NGKbh;NeCo-*cN4I&4E;Vdm&l
zVa4=_ZA%~ZbvO60!IOez=C0}Qv0HFhWE#)mSABlmMNO{!>^|E(9{G*$gkp^kFFDJp
z@~h*dMEv`0g@)v(y;fpt0|AcOU3zJ(o-8dAAJN(9P#y;gI0gJi@q$-B8{2$9GVsqm
z75>3Q%K^zo8MxxN+2TLHR{ciE%9&2?=m)&b3{v%uO<pg^F71nqs;_u9%yoN;u$8YB
zY!jUMJ@fnfH$2EFX|daE^UR#-)`fI`Gp-{?IkCKjd^Pe;Jst~4;&RNj&4AgsS&_;X
z^=0+tN6oRD3Tep^<c?%Fz6+0B{nr5gFs>+Xv28uaQdn%Kw36z<u!deyfIHjyq)J%A
z<ih3ns4KnIj)9p)M16i;Snc{d!~ATo`7XkR{Ma&S6?Th?<bBHw9l1L4cc6F3Q8M|D
z@*k;4^c&b9j&iEs6rSB5F_8G3VSXOh&O(btN5|B2P7Jr$n7)!(J=tu^Q>+HIEmo9B
zim3k8=#JD%6ghCI4BVQ<@jqR#U&j^6#}-}oy!ZI-$K)Z$;ZMPagxjj@P!6bx5^W%T
zpy6Gcqtv|)LcrYWI4_(~f4X45j;kY%JdK6T%lgZD*}N&3CuU#qt()Ao5+FpJW#41p
z%P{Ub%u)l^Sqxa>L~H#2J4f=Q@cjRmBiT+ovu<r=>DdgvdXn(vS!ZHmq7Aa4eqnn(
zG?@63m;>3&^{DSn1^oY$7d4q3Wi+vRknO8V%;Lj0?q*Tv$Hk0|LNn<!557%V33?sT
zB8umVw4>QO#Vag6*getL8ausbJ;<`d4~U>--+A2s#q9HyBb&vfR%`k4;aMzE9j+(U
zp`n&}MMW@(r;e_krJ4t~mkC*bU-GwX-{43iKZUC}blWF?euGa6v#r5~M!Ax-pDUCy
z?-r(coGOT?RHp1pptc&C^L>gqtC_s=I^HE(CBdv3SQN<;++-20=^T@$p%OH<$KN^b
zWmr{BMAZ*HjCe`^i<?qcr>CF1T60wrKBKBWsAEY=yKunC*QIw{0~tjq1jsAP5yP5V
z{%>AzK8s3Ee^GB1YO63*t(L9Q-f0?0@`X0KY|n+J7#2kkE-PE>j?&Nv>5yMV6t9BR
z&F1jK&c8UQ3>LLaEq{JH7Jhixi;IJI?f!*7{5Xie0K}qAdSY^#+pjO+5-|S$$NiCO
z=|I>+Q7g=I|Jenu-8Tv+Jh#C{34h7;Ke+&KQD+jIcSv4cEcB_qb-2{&nzCFNy;SFA
z66z{MdH(Uq+QF(dSApn<Voms|Fc&ZH6w0LP;$K`z?bj<c)F0E)_%sD5&o+4O=&T1h
z6(VepRTI1uwRGT#)yTEH+=4otqDko-p^c}XeVW;q3M?D(qD)I$fK@3g?N5ETy&aIu
zPQn^*k9u{P{}1sbYb_xkscn)6%P-;iA}&?^LYXt_#=R`Zi2Y5im_tKppVI@6DK4vA
z+wJk}%7#ML&8672H>WqW?m?$TY1D-!M|u(x`gVB->(jiJF6kFreLS(;t@W66oV2%3
z^S9~$9_-pZEl_Q@v3IK#OvMNF4|oQz>ptFFi4x%k*YD#?I5g>$!rX>tMbPFLS=*GD
z*w}k#j~(xLHQ4H9X>cH_h0HK}h2Qi9OJJ1Xcq1|ceFKSOy37CGync?+zwT*(%gd^x
zJ9A=&Gs}Zm63_S+59)-osJY!`>Nbm$7mE6P_<$+Nu1J7~yty{iZ5{<@97O2W+)nXG
zlXh0@-5FW(pjrh!_u3VL>E1~w&Ny(;*EEUBPD1iY9$<O(PBpNU_qQe1N)rxxz{v@R
za`4$)>-ECg&5o%lt@p^#B&#I8^gBwdQDaWFeHkSJwxOXUm0;u)aF4gO1o|b525-Gp
zcr~LP|37&#`D1>Jq{}AB78bd9mRZaMUU42*r12UDV#~sebS-Y$k`xeJ^2Sb6Sro^0
z0wiANI7jWTRj2h(y9Cpig-iF<K0R!B)!16O(d?rAY@&Dg&}1lwwG8J5{`iD~h-pe~
zr{65>!aJn@W!hJ2JRX8eYX{K1AM&oFGGVV`J{h!bCJI}lvg33{OBeXYhYR#==RYvn
z%ztCD9sS-s5C7bAG^5gUIA*@oCpt3azN_N3aYSXakc&k4o?sC1izBqs9{mqJl=H~H
z?KXn$)qxild=N@c@s?cf!__*{zD~tId?2fuLCs^W{5M;0MAQa&2VKKfP_FX@nt_TR
z1n0q`E+;dFZ;jnROK$E`zA$CUrsHa&lY0R1pY+5U92y@i@758!Y({OyPhb&4bX;R}
zHgmn@QjWtX8_m2<S!h&K>*nns?|bCYu&LwB$^G{T)Uv=asAvPTaM5*aL1%P(4*m*Y
z$#qPeMYV25W~+_C8l;#kmU|PWdwA3K(+cb)Ue3Qllv|dixb=>?uBm~oUG%pa704S*
z&mg;@g2>6QOCkmbIq1;EaE7ay|HTAn%eeQ>rvrWm;@O6HYGPLp6Ql$<tgN62avB%s
z@LrpGH<#WGJ~!fb$d!TK;)FOuyLQMnu`5E&hntl6l&os{)D3y$lq8O#NkC+_g7>+K
z#yLO|JVJoFzvJF^7NNGfx^W+$zTJqS2%FH^yplrItVopr`x`dlvp2xAGYh2lws5_i
zXXX;xCww+1UFSc@n-1Ha1oeTd)>XD?dTz_mJ{EpH9RD{7#cj4pWQ)ber82H9kE!!)
z%X7iaraxhltreVFq*soHEc;??=GEIx4O5MecGdK?wBYNR2486EC|U-TsK%!IpuA4{
z<!C8P@~r~|i`rNVpIULXNN-17TOndP?oj4cT<@{rV)KxXyA(!)tPm}=kQcT7X06D@
z4VM0iVf#oR0eQK>dC_fs9h?$VU%*40hO{3`niWZug^Gq)mFElmAqxJydDg&#`*4RW
zbf$OfIDm9&zjJdmU>5csKG;kSfBtHu`_y+*U{ker%g?96r<T#X<BiW*ud@EuvWe@$
zq4`+3P|oPr+dgRuvH(EFvOx~_9K0$vzsbxJbXDSxCMTcXo;8i6`_o0&!*~Q36C8?Z
zDk-3MIyx*Y_u8mO_QreGyl`n<D6m6J;!DG4N<~`1cYUz-H-}#7nVhHCKWCCZW!?eF
z&OYR6mvZ|Gzb<)b0$bE-46=l<6^ugx&qI2&he<&F_ECs-L+_beKwzr$*fpntns!;A
zHfWzjqUznUDd03yUVUNI5F6H8;QH;v{q-?T4ae1$fps^&`ecuusp$$Ye-Rxl?+Yvq
z&D~c<dF>M(Bi^+;t7G@}_cT$fdC#HxRYP>H+rIyBlTiBq)=hj@f8!={+xiz;!CTo<
zkky1rY-`;5FvCe)ihGkgW{hrEu;>S7zvJxXNKb?K?$Fsh7<;;n8gj)3vzgiH?;a!-
z7%tuxvN;X%;&{6$5?7^}*flZTa|5o%=g}{Hvf?i!bQmtN+0b5Cw@UpEgx}xBB$Llh
z!TLAJ`aewE?+O@~vvt$pNDjRR>~%+7lgzAMreCeGi^d@hZQv~p(ndtod#LqNZ`Iew
zbi(}`$E|et%-2N`#WPY~>pz0liy!D40-a)7!4DqzLlz^N1;arH6Pm7HakLU#_83gg
zjzqoOCeu(K@i!`Fg3dG-S>GW)M<n#I5gjaw#AI5|1vUT2QZ5U{D%~ZQcGip9tvd<@
zLFaUe(!*5Hp-9}LP-J?`33j<80j_I1Y$jxTP%(n|{xN90NuItNx*(&6y)2R}cyu?f
z5GuT@-`EJomq$)0J;5t8C?f6#V=G@Bd1n}b-yxTUJ4l1nLt};i)?^9@6>rMV(q}1%
zf4Jg}!E;yirGPia9mX<DT8RM1od;ZyfzS~|Rxqd+nw*EOM;)XgTx6<lJEbjy_km}^
zG^j}1<`%rbz+Jn4n5_4D$aHNqgR$lug2ZWR6z6eBh33C;Fk6vrz4T+On_b$H3Xodo
z={#*`rGQ_0hJAciTDi01sJ~rHm7kw~7ZcN`g}o;%Jk~12R~E$Jan}icz7xj8#2g&c
zfX$^(yCWJ8rcVydPaQ>J*ISFCUWpz5YLi#v=o$XpAEj+Shmb#PVwSb%F=YwvggFoF
z??Cl_;`ctHQGUPdtF{wpzOj#K7<@19ndX9qQlVb>cj#`*9f>6bvOIz6Og<0ccmv)@
zr|~8F1kHA4q7)~c!sG3ai(bx@M}#=_mE`6^3l1DwH_O!cD*Z2CdF6t@dTo?#8ah;@
zh}q`8*q-cqK3Q2y>J4o+0}~CtIz`{+`i~=CIc1e5ewOyaw{JHGNQ#HJ;3nk1WVWvB
zN@JDs5cCXX9#S2Q*@S@*^u_p_6%LvOH>l$7!r6d_c|JA5hd0)p=REHJ&pA(igL@DQ
z8QmHYwFb#>SEr2){6`pv*DrhI=2+L#=o>npij0Tq2TqoKcP1k$b4yQbhd(RL8~;1y
zDctDO9u%;%wz4V3@ggm*j(Torr3D~F_qQ=;`Dj#2{@B4W-2sq%?k|5RHx(Q!)U>ow
z)`vjqQ3JJ2or+$aCSx>Fj1=<^c}bL`@yL}O36|e({vP}IH88Ifis``%+6>3a`xPTu
z65LL@ch&k=%2D}9%b-I#^Aj(v4mybICFwq|M=BLP`oc&umf-GM@0YbV?`9|EJ6L3@
zFo?H4ent}Kbu76lH;JisGb~O@t8OK0eWX2zol1o*BGt;BIc=%vy&C9*+?BoPsk<QO
zyOarGBIbb~xQ4-YatgacPGUEhV^VrVXjHUQnw(vPcwL|J(7lDZ+@4E0`TycYo}4ft
zQS*@g@M!F_6wI@6=X_=D(TGl2F(nYpSB*Svi7p!ceuTGT-$i&s({iB1=TS^3gD9`X
z%Gy030|=~fdwR;NTk-w0{OCpdV9s14<Z7wH12)%=ei1a@Ib?yLFx?3Fvy$urZXnZn
zO{_0!xuAUgPl~#0_tRBy&r=LrA|f}rKNfvJ9p~G0{k*K>NiKKH`D4*{{;l6xan5VU
zdzS(w{-QFRA^4^CP1H{FNn-U{iz6dfj_e>q<kfWp{=wPSPVSg-H{PhJBJ<YQKaT^p
z9UaHE!j+y~)QHI30TNe%FTYxF7_Or=<#l8AKbBba5KoNcW}U9U#4i}ZgYM_2Z_}R~
zrC0VUDk&9IiT)^*5s6V8>rLT6d~$o#i~GL5Vz3!6YWmLH_z$q~-)Czm5yE#(I`<07
z>9eJ{KfD5w{)n(Do<0Ep0>@bR`RdvC0<QYbi$Y&L<B7VPfPzRCkNZE1r77upNa`W4
zs7ZD3IYJkke#z%sn@WZDvuCCqrlk*j%uP(jscC5bpRtv5AjUz5wa-r19AQ%%bN4JQ
zg3d$f(}4E)=s?>64G$^bV7&!jnu#z1S@uu?^Ufasd$e6CRO+xyFO%0HbN$ECFC%rM
z{1ip`3j+9PlaFQ!wzFgCGmr*zS-U5Zj{IawdeFv9P2@=SAM>sA^tU4}s(nPtGP_=J
zALplXgnh8SPv7}NOtfo0fg1tIK8fqvw$o(LSZ3d^i^#3Y#`6nM_nv-%d%@-$sEhxv
zfV!2CWHdK1u?skj<<qa%0{;O$6rWQ_yAmlYc=H??W%&=tC?)0U6ab8-d13Z|k~ner
zU)X4WXg|+6HroAPVWZBE0o*q*um;u_Iq<8MVSfN4Q?|3zE_X2A3IQ<0HL}0O5Pv^M
z73+UNtt*dLD9@o*^ZyEJ6=!0T?rM^oL|AmJIDylqr2F*$fdBTo_p|w%MqGIeVB0Ri
zf1P3ff^GkHjyb~rLbshWozKy2a-qLNx9N4)Q5P;;;81ud`|Mu`e98y%G&AFm8>q7R
zy=s^mIBlr_fR>|rxuIvI7cQKgl@HC<{j-4pYLd{KV*jXpn~hC@|Lq;Q`_Hb~6i`sC
z;e39}p8iT|O)EcLyDm?wgy<a={pVIsYpwj*qr(Qix*yMpiCR5h8(qSCh!=eSTgg$M
z&<sqdqbzCtGOO{75T65UUvF=3!{J!ZVl6zSBlm#Svdywh2l?a>1+#6F8m+QBt__rV
z(iQv2+U1i@zAgvdIM}$du~L9g<PwBz__H36{BRj@?GdtSf7M<lSI&Q3@Ey=a;OKu;
z<1fLj1Rf;$@{$dUUYexL;SCOU&SIS>nHrU)%2zk;jv6p&!XU?aONw@~h1D`E6r5e0
z3kR}uJz5zPuF+HK8!%a`Sve>3G(9}H3ig%AZqM~zvfelP{9}CP#{tqG)tYc!6PB+2
z-S=jT9W!?p^J~KB%)Z@PsLb38bA+RWK3a0&!9&otrD06pnZ6T?=sRKiKjE*)dh&A{
z#d#RM1O^-^-Pl4jN(Au>zEOPR_@^00?khwa8|T<bbVdku+RCrcEkF@=w&O&Ne2w5J
z7ut_BAN8xoB2QlCs4bHpGoN2?<J<s$dA-C;wTvsoLM{mPH_7UD5{jGbhX`r%#7em>
zr7eUh9n8H$u%n}6|I|!m^&S@|=R;EB$x0P#CrD*zur<+fivpgLGA=PJAUKL(F&>Z7
zj*y(~dba=}_XHWM>YaEKGTkZ`VAJPsXD+r^0x&0|Fa@KTSRk4<)=5XXQL4t4CJ#lX
zOjglmlxAqW%X)fTu}L#AotUjWc`!=a*3mSCRMK{htycR&@iIn$gTsa`^El*go_sZm
zy*_gS>_6CY$q(d*WVNo=GRretDb?uc>x-(Zt1GvI<#Mu`nVFU9t-a*neq~(PRVnZz
zCta;u^CG#DA0aCto=xz`U-(L(v;xxfwDXdnOUK=gp053~F&^fkmX`t?d|Yvcww{XZ
z8DwQIbL=p4mo!bA_JSi*l2B(tZuzNlF8R-MJM&E4!#|c<ckr6`u*2xG-J&tJ5s6jz
z&#jro^9cvl$EB?hc=$z6Tr>6XPQ5}`Q^3a}#8reVStD)K*Crn0S!O>mR^LE<0LA_v
znzqn)CV!#K%;S;eQ)S~XT81UgwnHq&%WH+HUl7CTyA@(lrqC5!Hyw>cH*Ve!zA5<3
zS0Iy@|LN*wmSJM&KIF7V2Mhl5Z0I`CH7ptS@u;B<^&jx<Um)wm2d}5&reR{oVTgx+
zo(&OPB7hP?2keS~CwJ>9*8A|hf0w0|r)>#J<N5<4{>vclm*e8W*Yvh918Q9h2}`Mm
z4Esnrk1C2Al!;f}cMIH1H|jigx<EF3wVRcB)!x7%@lKOc(GykIN?Nz|ACah@kp*W=
zid)ydNJyNfd@?tcq5V|N#9hQ+WNR*r_qS?OFTsJ@s~;5yKVTRSCY@k|VD|2j?t)!6
zxs+nD>=K)UnyH?%>P|-kebQ_`(wlN)H3Ql^z4}E-T_csn_Zs;uZdM$}8%4&&aV3>=
zM>qLVQktj)N|&4`X-@427g&EEoqoMJ6*(b-J`1=B72cKHMeG$cpFj0;7U|YhuHK=0
zuNYZ)W1&*UkpGckl90k;9PblPOfc`VuECv)5~L9?lw1{@OF&(NKs-3v7}@L^7)Xmb
zJ3-rOz#dZBlpPH_>V`is-9#NIJ8xfp!GwO%=LbSnYO2X78A4DbVoU2n3u+c=>UlWu
zQ_sqEkylUZ4pySWO$Su08SG}7-aqb|J3Gv}A~EBB%c-Mv+ht@(&cq)?Vj0WJ731fJ
z+tHx_rf_`pC@?xs=bL%Kd-69XHi*k_fUK|2BUR!chV(D*v-1$w`DUDrnnLx3pvn&M
z&cJD#quHbEW#F;do~&1VGAAl8myzeFMJHovJ34zyNp+=Sbj_6akX!T*$lt&dYJe~x
zyjQ=1(r1?7(=Y9xi(SpN3ideb9b3u|<;Aj~Uy%AE<>?^?y!29!T_;_rJg^^vD-1d5
z<I%+-)$5(^s9ps4gY3n__h<RU^@kJkl)MJahZB&XE2C}<JOu+^N*Xt3S-R@jEMn&u
z7KE*Qa&up5XlZfSBFgWLSRmr7fQa&^!R<fY%9aoAdRWYu>T%>Tk6>6$O>%U(Subhv
zWPvaZi>vB(UhDXCrj5CefY37a^&Tv0sKm+=`BLfDkVO_(>(VdN?t>iTCSV2(Iyx1E
z_FrT^f5FrL#hvSx&*;9xQmC=-w42lwDEw&Ar{4$O2uLswWzwD)8_U*FsYx$5C+sci
z_e0u29U*<ETn~JFLJT~P;?WDll-$wMUi*hWsiz(Atg0$e=-64qi8ia+>C-95CInu2
zXy~QLu=$h>VOQqjowDUeFOQyd10Du91=V>uB(PGktGW~PvAv@uh{1MH01DSf`<L73
zQ8WaX$Nh8LE^Pnrw{06VYhNGa5z#xpiRP)fH(X|1UGvkb!eWZ<DE5Eu+H*}-u<#hO
z7)MO{_C`Be64+<64`&YPQK5x)2H!S}@;Xg+1{K1q8ARTRHEw#|#9A#?tJj80Vbj+u
z5dflNQ14lRb!<<;F0j%2=!QwIidrHYQoPZp2&l^0A(oi0V{9pzt#-Y%Omcg)dAla{
z+D4X4D)pIIUBt3((?E_&+=FmY@w!C#L{875p!@gJo$t-z*$_vOCcUOH`v=>XdGpoF
zLjE>0`NzFqDjh7y9pZ>cpzeKKja2s}$Br*O<GkUA+`o&ickaHiGyNd^+tE@AlST5q
zCLivzqaX13QDoXR8N7$^Q%o1kX{jS?#4wWgg*ax7xn|1Z?8M;eF>2;?fsI5)_Nw&q
zeJ~!lLh@*E0QwqHYNq6|_@zB-%@uL9#(jM1b<1(f_>^$|U=$)Ec9dmY8Y;qxo(uo<
zZPdE0<J}D|?7k|UL#cs#qsOTu=NS{41x<3OPzpNUBZSDM1zcJe?4$ehtm}7kQ@{NA
z7vCj>qMSHmh=2v5#;$fu?lFUbheI)up3WJbmDJ6&CCyh#Y(&22qvr6Dw5&1^{y*)#
zcT|(<`ZYX`ZInSA3ydNlBA`@3B?3|u1nDXwQlrvDN|0h8kVHXX6ancXA}Z2Llukm3
zfb=E^L`o8R3lIn;A@zH}Gmf64=gj$j@At0nUF-eFh48FAcfGE?_qFdkE0*QZYK;ml
zHS1|1>d;kWGMuKNIo`6WvlfJV{W6{-T9akw`0BZ~aw5l7hyvZVbpJU&v9aC>+nv1k
zbt4&J$X**LNemx>xmYq+6nC0C6VsV(=0Po^VYSX3Kvq9E*)L8Hw^Ay4JR@*GR8rKb
z3_2O}MyFNr2Z8!eRCd@W=15KTk<#R>A=g-@P#UNT1vgH+Buck22_iW(BchX$g`wQv
z5vyRzO#JGq=eskZ4Fcc*aa6_9Gu92JJC(?c8RM%lUNIi*A*n|7&r;d6FbA5tzkhv)
z+tCzb_IXb)PZpW$NUP*b67XQSsCqX3WGIhkO=!re#Tl=$+63FEW_iqejdYY1zBTeR
z<5Z&J*zO(6gPNC~EE<pwUH=#K_&t35+I^S9)!zYd`s;-?82HW7>)uM47mJKCQBNL^
zBoeaibbIq?wy)|xvFRxkgDY3!W8>l)cMzZ}B2K)a%cm+cl5dwB@O^i%d^SFbg%&Qk
z9;wb|Ij9MHAZ(xGW;hw44?RA%$UD)mzg4~eUW|{ewRC~cCqp3tEY5eDzOxEq^8|(%
zPpGV|`U>!VugRYgtsY?wTQ|8m-8v;WhR~fdns-St&AR*x0zWcH8@F;#SU_UV$)V>1
zjvhU_VA6Mm=E0ls3>H$ssY{|x*6=mBpm3rzBVWz@a)!S0c%~S;p4*IaY#Q8%B+Em|
zmR`S-JnSxCF<T7{`Oy3vK~+E&dC;EY79vNO1IJAoP#DVZwghnHZ5C;?r+@A+{iI?e
za9c>J(vyFSxBu);R+9EUejNbFZtOB70BmCuZbdmxKNtwyI}ltohiul|B*}owVZUx2
zPio$6qApA0u#J21%wD5Nb<TZj?*(zsp2UnsX;g*8aVNMe1h<;)TDaW9k=na=ZvlIU
z8f)w*_o+;hf4}oh2794qG>A_ldI1y>qs6EEDR-{g(Rj}BW;8!N4dQ(42TbG7mVQPn
zmq0%XP^aj;p(U^Z;$G=14NlxdsdK@>3-xz6EQ)<QVk1jSQ^tatiac8aCBoDY<#J_O
zIs<o_eJRIw2D#Xjz?N?TNs7b>_5I|Ik>fbvZGfcjhgVY^eOKj4ZXI#S<BmjXG!fZb
z8O*cuR$=Kx5unL_|6P;+HSQc>O>dmk!B11w*(=f8XvDm*;`Dn#d{kY=t%ds<zs5Do
z37L_pn7K;bd?9Em^7qhCk!J_hV5~lzb<k*-j*V11ZvIl98<O50Ia>CzhUFtCc-%5X
z82V_`SMnhf@K0jxe&Om7Q&{(q`>Igwk2|?Qs}ujbR{v`zI1SV;hjbm5(h``FV{r*!
zDIj;}`dJecpv!?cl26hM=o-nA3^0||#Z`f(!glN+z7&Xe-jg5BaE^~0M~>!4NFb;S
zp<@ELPwEJ)l{-d@qr!3II$;AavntI?Q^#2;P-0dFvQs&bbjmzvZ8dBEPggS^!m0ha
z*v2iwlN#|ucC-+Yfk>{}xd;`<Oz=~sWijXOY%}@|WO+q}wL6w=>_-M5eVr3G9ISqG
z5aG%3n>df3y_G^Ysu>1m!~D7b(B{?QFcfRKzo^$bA3dy?sOA)5jjZui9x3{b<1-@Y
za%~7u3w%=}!uDUy;e@S@Im7?nuqy@pYcQ8RpLQ0Y16y%fr~jDBFLdoS;anH&EAGEU
zrBe4-Fo0WMUcV~1)aO>7X7Au|vJ6qMmtWpuTuAW{o|%yB8V4i8T1KX)Z#nm;7h6QS
z*$qDpR0o*ve*%a9N}<zuJ4Ta(W71@titU|1a?+W(nX!kC#v*2!D(UpoO>U9wYtLk?
z*;soAkeuWLv%1%>-y}bpKCW1aa~EBQMCB&ngI)#`e&w;I`Vd<iGudRN*~24z7<H_)
zBfW1EPVoACzqJ}B+qGE6=8Dwns^8JgZA0wb?1y?57KyGs=&Rd#Ebq%x6MB^-`hHn@
z;CJiV4ZUMkhwt5$U4Z={$GB#GW;1B}r=#Oz4DO7YiERf&Iw2v>0HvgsW_R&{g+h}X
zvf|o9!zbz&3%m;1$niSz(aZJOY1tL}A++D6F!3`tdRo448Y2klP_ME@^cdT~iCVW)
zKlhNt#Ee(`43_YG%KGF8UL3$BZk-Z6cULC%=De<EYRe@bZD($N^S_E>C*FGXC&A9b
zNFQyr8ry4tzhbj1q|$xkMR%)>efV+1=+!iyf!4GWl+VQM{O=4jul+P2`}EAyrl#7P
zxCmB{LfQ$E<6_>}8{tq_@0Y0IHBOzrbojdXcYR|!8xCw(lQ>$YuB`0&KI^`;>mbl|
zqpXWpw|)NsMcp-84)Q|Bsh#^iEsx!_M$1ia?YZ&;UflBA+B@7j-CMhkKPn)V7y+{{
zFK@2oY;h!bv#d<r)9vsZKq9$65iz^L@GsfzPt~d5c47;-T+>lDMYdU5e^v<fEw!yJ
zk!`K#NpEoRl4xXgZeFQ|NeP7+*k7C2uqLGF;b99k38R$)l!U}ZM+qCrj?ILUX$i?4
z`y{krB2OlVdC@xSVij-x_4-bSv`ZH*98^~Bbtbrf%}EUbP6~LqUYRHYoHPyaaD7)N
z{IkK)l@GQQnkE>=umS@b+l=Kyfi1U(jn6S^zdt13UvjT3r1HnSbU(w^8-E0XA?kGY
z7o9JrfelBW{$>Y4&nK*@BhNDkXza~}Xou*yIB`EezwkZ}Gc&{NY^gN2q@HnxtKe?@
zo~8d<PWuv6{NNH4nP)Q64soL}(iPX1Jz=%4Ut|X_xsdSI$!=CLZ$%!(Y|i1=yW<WM
z#nj|Qm>Dqnt(r2`#cYnMYus46s7O|YyoR6wQ7TY?b7%I0(esMw+vdGT#y8;r6|`rP
zB+EKuSt4VZ({J_mMw<6cTyXD}{<^~hdzSRBraJEX597KPEaL3pRMvp`>lc~tY(>NM
zdz%!M%RXN7;w^DAGDa?2H_F}wsM}rX&sr=Ya=|b1x~jnyV^+P6>}B%@hB$7Fjt$5Z
zrM*7qSc6jrrv%+g>~T+~b_1g9Hl9xo&sD!KuzbetapRM_t1SfEbezuuUno^s4oI<U
z9Shn7+XNeObcq0X%|W&Ed?9PR#^B$r68$yKHfrCmbXkI4jO`uRyDmkN&zuFFE%hiA
zXVw~~e2@f2<(=H(z`uo9Cv;PGw)J@^>F*8%_tRQ!MAx=jf$-t~SK6?sWPiy^#VXWn
z>v;ZJXi>7@+lBrO9h@ZlU#ZsjJ$gb4FFxJL>Z^pzeHNFO58e~LXIs|$bR<C?7@*Fe
z>l-jFi@W}v_#T}Lh|9{oCA@Ll5N;49Xz<zwXoNlf5dJ}Sz_k&f@KF*Vk-PZcG@pk4
zYt;BEv$S?d-Y-;o7T$S(5WfQVGG7Z<Nx56ME&Z}o-P&^iw*-jikA;6-oBV`-JNfqT
zT@DS6C2pC9^Dh2{Unc*)`+fHzM}w8HL_pRD$lqO?@$#U5mfpVx#Lf}wqR)x}-Y2mM
zS3*g`e3r}A&cD!oA>dvzPERud259Np+T>Tf|Gtv{`Qr|gV~%JUm$+#;0F$5e*W`PP
zc>{%k0&vUUW!YX!+lF#^ol;MT(u?7wKUd@0tz>$}#`!dP%*9fRix)+^ySqF8zZdYu
zfz4cpIA+YB&#^5iD12lt6$}V>`rG>(fk@Ljt@}t_-w_TneSJHLKZ}2=?`6_yzwQyo
zenHQB>nnueZ`OOu0-bxAy0{4B8Tq{ayl=3`6LNu@VbRga-HToC-mjU^f8Jm<y!=Db
z*a=F+dEPSwG)B)wPd4%nPownPtA<U@O=;#y&pY2{zRzta$!lE8K=-G1i>reAxlSLZ
z{{@N!tYx8B7#+Wt1<;G=A(Q~)O1*aeK7}hGOX?q7{k7!Qx0^H4MU%Ps(CpF>{8oHh
z>;(2aq_f}{Aj6l`lq7$z5b`B*|1H_yMN`#f)z!lG;{H9RS8v6c%h*`?=m9Vzr_c>3
zyqsjg-P#T(g3$+$q`&EUTc*9`j_~7SOFriKdD`dvSrLVEHvC8WEa?cY)L#puNp+^d
zX5TkB9NfJQ4UWGw>DB!{KsmoI`h&vnTsQmv0}Y!t1d_rJ(`}a6v;vQ+vs1l=x)Mv`
z%s;+gWpEJ%BzWO1ID-V)n2G1ew^gA&I5^XwK0;`}HDr}K)>(+3<G@BB2P8v<Jw1Z(
z*Ej#*wbsCEmygktmB}vqPSIa%!Aw^n2Y`DqX9<Ha4LKVr%uHWBnDR6S6>ArvQcy+K
zF8&!1?hF1q;l8)ba2#cQurR(oer#{rN(A22`SYYiMVu4Y!#|{A;jzr*tbUGf)gHfp
z%*~Wt^kiT}t+?Ww#h-eM?Gv;Gn8inoY+3W-<&;{c!+1ra9z^4NAZLw=2-x@{I=7sD
zFIe91-YgqqD_l7kCSMs_zBsPO<uK2?8ynMKNm%s=P}7?A(_XyL^z<zFh$cLIxc#U+
z>T#>3faI_BpGtUt1ze~p_NSpU27ovJpK7IlVxaY0JwCIWcQIWqQDSxTYIJfkk+c}M
zH|`Y|Ry>t>j1^9W;E&K$O-u7$Qr32kq=qiA*<Dk+O#u?3&E=&ioVZRGOnVSgDL^>c
z)b9k@`mx_F>J|m}q~WAkoxAstJfHyzv)U4u{nSj#ThQO2qJ`}2Czs94^!t_aT9*Oh
zkq>P5zgb)Sc1zuoTdy?673h0nA<{~Y4{L8+y3l<VC^fp|3y+Z&FU~>Jzn0u>?^1-z
zrmq$kLEfeTEUGhZc=3o)#P9If7Dk)kRFeB7d8Lg9iMcZ=VPd;nmgBm|E0Dx{kj@?o
z758j*gRWJoJ?ossMjvE6k7|t3*s1ouMr=2CXlovHU=?anb~EZ3tf}$RrOrx=r%ZsW
z(wSvSpi1CdVy8YJcnY_bgzJ?Z{af;*J^Pp+Vov(fh0E8V5`W>S@FU#kk)Aj}%FDpP
z@<;hk$i0K|**aLH4XEF&U@E9bcD}BElPvBci+g8lBd*Bim<%&93Nkxc?mtygKqQt4
zg97@*V`im~!_s0CY!N4kn3Q(<dyS&Ae+tb8?HaPGGxN>#F{ARGW5Asj5`ZAA2-#7y
z|77!jkPBj#YYsPQ$~WOAQU@r81fW(1Xr^Wl(xc60jXGRaiu075rfo>VAtrP2O)rJ5
z=gB30fXbyuQM*IiND{`)%?X)+bbmo48&j1bM{@uD+WoU^t~V_K)V4R_?(Feili2{F
zEm6cMco6i!<rJO0sO%(eZJ;|l2f7C47I@72vwh5)qjV2A=4;KnoHx7&W`t<}Jpo}&
zAp7Gm0Nr?@Hwv@@Ju*YzT$*lfRi2C+1T~KA*@1}3J+xK$*m-x%m;`s&V_wycvB%ls
zvVFeJpDzNi&412iYcL6bRlgvT*5FXmZ-9@WxSe%VY7<V+x~2*hF=%wcXY#@!IE*p`
z9t|WZxhW+ektdWprVmVuzSN(+Q2_S1h+s67C@bAA<C&`Zk1}^0Zytc*4yCd%r<&Mp
zU2eMpOxb6i`{xTGD)m5@i^Y;-c1p@XZsMM#vc?)qw&m8C9D1&LJ^ZP|ci7-pxULbf
zM*uzsocveIVO-Z#lx{SvKcBRzPFj*FzGqB+dx=rQzPa<TV}GNZvZe~JePsEMK5{Xv
zx9{3lZTPWsBv<6~$}#e1T?4>9n3=t6ec?z~L3aI)YLSP#1pSTL&USbK;>k{ylG`ak
zphWPG1%Gxv={>M8wmmWj^zP!nr*~Uu7y>h~Z=t^k0Qg^hj?c=Bvf{PDd!0aGCsARR
zq}Q{(iPV-X&1UfJF`lbyBn0N~d_YZ*>>n?yAF>^3_5F`T4WKrnbhkB10$J~OOJw@l
zdBJcp4AcD;o@8GAUxg>1Hh-mW%~4jH9_k;BK0Af4L}8>C{9=*qy5%IGbhO4@gL7~R
zxih(RyT@&3a}_1TgJ<n8r$mk4y7=^f0^>;HGQlvaZnorn@p=3X!f0cTFo=m26>tn#
z4)-P@`W?%|HsM;Ui2)$=Us@MXr%&jKxNKJYIycu)$;CznP&8V6)}$_ghyNX^>x5Iv
zn!2%;CCmNFIT{$~zu?Q?|I9Prx<>fUs|5p@=5m~QBT&+Iz(?D(JiYj|f<9#6*<q7f
z@vaZk>s<quU&@PkV14{X?ypnu7rhkTa?SaE!z^0Jz~yBE2!4j^S1Xk@uRd$w)U=2w
zcl}?4HZR3W?4NG6RJV#Zk3}aLI1@j65uyP!DcI1(j_5qx<mN(W_C3>6#ChNI|K*=u
zB@kXD#eV^jsN62NnpD^2mgDX@{P?<{&18=DS`2nRZFY6<59F#d>vGj@MlAdXE|L@L
znDpaKfh#}IvkZ5x$yKfQ)g45B0Bd>IRkag+{{i<V6`7=-HU%g(pSZ*mzyr`EA<L8Y
z=0$MrRnwOyGC=;BA9$;F_d7wLM<ZrcTA<;xAt#Ga4wK5GK1_4Tkpt+);VDbk{>}hE
z`m9iLif)m&xh9{R(fJvz9|Tm-Xzx70{}d)td6<Uv#kD*G9iM_5c%LcFLpMIq3Tb>y
z+$w?g4a)y*o!tkyJTCCI$l9}K&v|3xJC>zZz@8i%+Y1<<hVO6S2ebfTi6@gWk0v7E
zS^qxDbUuT>s+#E%|9BX85L{6Bk?CIvc(RtjfLaT9Edcdwcz=sAAk}(Oy$(yOHY;iU
zlNZB{7cP%>iJcfCtS+6`&c<?Y9Kt{P9n%pE%=RYSa)otnKX8`KLc+qr0@!i*OkQ(f
z$7N?<>ML<}%Wp4HxNUSM<!gi3w;=A{*r6_YB~}!A6y(O5MU&yFZxl>r_+tXI`8!c?
zu$RxDJT%wxaBulk@XU@<l`FEdR<1_@Bbj&FnqvU|elpd*2TD9o^40=F+p+VdE}`z!
zQL{))la7Mqx)h_sbsypbqHBjGfe6&Y)3lhfElQu1B!&S0NA=$VJ)^7TsPkto-XkQQ
zkos(72x>j~spO<GyW2~=^u=va%*K3~oY?-Y;ZTjbHHU|A&7Jt%XLQ2NuCqRI4NFW7
z=PsY)%le<SD$M=D`-MY}BfQrCF_HtxXDI2jx)fswr~?B)KxeAN0EI?C5sp*0kR-3M
z))2u5pwR!Et(O`@Apek04mjL>ngsyAV$|`qiYp)<PsR8Y>;Tddq%6wU>-WFm%LEJ_
zpEaGsrZv4sXi0<k%C^@)^&HT$(@c6ARo41Cq%+)l{qJ>Bd!J{4o1m2Lz88+uC4j|%
zYzWvV0OkBL!#+7z3t+i|?uUs7LQdX_SNOMT+y_a)%6}*+ja?o}P3-?^Cjs#3+8@%i
zUWIh~ACCUnQ!c<*87ZE87Ve4rA9hkNc3ms<jNNc6-Ti+$`u}GxG2r{kW1c;;rhxCH
zmYDx<0W-?|B@%WTzf1C%Bjqi6EpBIc^MB=RH3uwwB41!k)E}3_y#JxV+ZBikd=@=%
z=5cxP0J#^}&@ch&kez4(K$O>f7=ZO|Ej5+P_19@91*$8U@EXc&lX!A?=Noa`udLAj
zMDN$r)LPUB$>X_BG&w(U{xCg1i}IygA5B&G<DTs8EjhUgh!=^+;IHf_9GTo-E&mm>
z00B!tBS23Mi2nj1{?Ma@c{~q1$8IeFNCP#Rn}$lGKd*&`n3d8kMH;B9;(Li1@F_z-
zqI`mpCBFpVL%s8<<iB+gf14m4c4}|zvuJi|rars`_4>9v=h_c=X?bsgKU*h%d3aRD
z=Pw6rH^7wlbBMHIwxZW_5ET@j)qjOB`d+j~3H`zR!P=OA^v!-F_5FJi>;r#V>zBmR
z(I3fK&cCb|_&VfrAAVo&N(3yYfCRS<-lTr$pD%^@Y=PYmSYQFfRK%0>g9jwm-{E*R
zr6BVAXN(?)tT%K2Y<2bz9@w`2j>HccGh*NG>1#li1DdIW`M*Q)zjY}3T$%L6c4>Pv
zi^L)+xp;nAYLc5q+4W65y7vkSx~aA1g|C??glKtrIY%zv)<&+`z<`|sa=|(m&fa+i
zcPU983i%2GUya->B_%bsRv~Zkmj~O}*ifE3IymUvqm?cI&{kX?H4eE8L%kWVb{K1R
zxHENN714boD>FZrCI!TV0*C8XQ<nxTEGJ5{p@jKhu9dnuku~m?_?GTvVOA~`5M?3P
zA{#sB27L@KCFqtocQ;x;&pk#CMUAcQlW*)QH+49-+GL-zx*WfHt~19}Ub&2UuhS=N
zcG{+NE;yxi)lfKKS=0~0U|vEO6wTEZBjn_y;<2!qqxF0Y?93;>ddq}`jq59wSDi<l
zLEpXVK6GfR_#?_8$yi9x8mVPDMBFMIS4w1S?)d!^7=i4%F4$=^QhD%A&(9M!0ckP}
z#9MCP{KRqYB!mJsRgX)el$od$K_o}=_ZRn+c6{PJ+*exX9!CD^B;Jdk<tr5RfKdZ3
zRiLc|w!h;28Tjs~?t+<&_0tA3GY5e45&1NPnOW^&{+wtkb-Odx`R$&)C7Dn-)?@CW
zA9X77_+dQH!$Rz=lM@~(`1T1@kT`o8c5lfz37TLmTY76=N&N{o%JA7jCJ<rQ4m@yC
zmC|PQ+2^>mQg(_(Ooh&jk-6o(Ik3`HPU&a~ZEk5!EB+5+2q*_aJ?@PS&%UK>hcb0|
zx56e{sUdnlQq;uk=CA`8J{Nu7fr#A3X&@9Qq@2*%(NF$BFNu~7P@6z1!s{kDwOeOM
z;O*P@BMy+bgWv++#>fJPex*)mq)m+5QwB_8{n)}az$IQIOC`xWHvJZQ;7F*@>9VS2
z(CfX{^Qyi$xc#I;DC9geoY{H)Ub{M1U!CEb?K%tpr2x#u?k|s99=T<Ju$F4CoX@7|
z!Ji*M&iv*~>FO1*mI5Sr3DvnbSZi-$B4;^Ckq#e>l4OB`LJyoc-{)Fsk;gVEf)rmF
z-1?Qg-?``1P^{PMCLZy6YwvvT{(P^ecw6ojd{iZn$rsP!0=H}=q5V-CJQ8WMpGw>;
z@v2mFT}EZ;<i<w%2FS7bJb%IcKLHk$X4_dt*ZSXVX+vN@x6Y_~S32i*lWt{ZD=x6Y
z@xqEBeO^-<oaEzYPRn0)Kk`SOm)QQF>ZNWd&OOc%Jg}N029LxB+%%d@8lS!SQ|=H&
z%uYh-6qOd7Kzgj363|Ba_)=FyE{I0TXtTw0-gYsSmYgT7M+KHC_1mBWSN%65EFtSh
zAp~8G14(@M2TQAzdT(CwU8%*7a-Sp4AUfPs%SWp<9G2KUCVusguopcmOa{2OX-3W@
z0p5rV_5`k=Urx1ABB^KzMT)IL`H#TICKuBdORVsHTy5qRm(7T;4y+zD+CbxYX>CI!
z$Vo2;x$;u?AD^0ZVq4uP?5Wj5sRIXHEH1zOBr==iod%Qpa1l34?b8Q%UrheV>x>{p
zhlLEzP10-WZm)Y03_{whv0_F2f*yW9cSTllHK{Q=Efp@PVCJ8SV7m94w-F|CVJLQj
zs(gF`ce&vFh<lv@;@pl;vp<!ubmfq-$sY5VRmZ$B;1=FYDBG!GgO<tZ#aFn99q85m
zvSzYP3J+dnottmLM6J~Vt0a2=xN?x5$E~sjz&wK%ZSYk%I}g65#e)!#u^dirPCwU|
z3Qv9(!LR{L-LXY3Bl?b<rV7yEoO3my&|~J-ra-^CbL<p-bJ)>&hbD~BSDOl(KMK#1
zl`>Nii*~D?BX>uyPc886NHFVmaE@FFCxr+!@H_5p2&y;nNV~sSnL&}&Nbsv)vI!f6
z#suC-3}9lml~NuK4Vt^8>T>iD<?!K=o#fjoCaSa>9bN~gwCBmk?OV8O2tv@cr*0Dt
z7MQV*%RZYPprYjnSJOqqz(Kv`6A_(u^+LOzAI{6p*0=Rvv{|L*pd2_*9*4qKrMOuY
zh!}fiK&!8`zo18*xEQI++MPe80M$t5BtiwbQ51fe=#R$gwk4FlS`0ycERUxC*xg2@
zc@8rt6GKFRIV0UoSa=`WbgS~xiz=Yzu%hHb(3}jNe<{2&i^r4l5#6{COsSR~xJe1-
z3R#RXb(N6S!W^Te06R7^F_o63rKdWzN(MI?<A@zNh&!8BVK*AUNNKmHk!EHhpL+Yi
zuVcxT4=!D_I9f04_lIkTqZc%)B?+hb95J-F*Y%?jS&j9+CQ?JpAYLv`4B`I*$#maH
zlINTe_Mi4^q^Wlc-5$PRzB0jG+Hrk;q05;{2D2}%^yWZWip$B=DeuH-wdX3!eOZ{L
z=~b7hPcPvC$(Q-9!2#3ZyV%3c76oJRR&;RGG#(mhDd%pLr83Rv+bR;U1nKQPPAqJ9
zci+viE?uNCMOG5pPdhxJHKWH%Gs$T$b%o@PJGDn4O_JqQw%-X;N@{FVLpQ%*GiveO
zBi0(LGX~UF?)YkbvFtqY;PT9ZG%~54J$Jz?^PZ*ZoAJ;i6eJpsVlUV5X*5lMTd6eT
z6ls+yyN*=m4o<<M-ioys8#5t{S#5`4FP)-e#~+4`hJ#3p))|c^%?9jQPP)0tV#wLZ
z-K;XuL$q6xl4na4ZW*G=!s&7-`&O$2ZE{1O_GW86s95St;*7km7r{G+&SLbXDfAmQ
zst~eBq?OBq6(h2Wtj$Ucw@-oKAJIm8Zqg4W4^xte5V&>CM`;vpmZrnSGR`-@I*Y`>
zCX@Jy3U7cj9QYmF*$tPjUfo#<T<=MqTy*Z4fv_&_?05gDw=#!eZdr)a^m01-<usPy
z15LX?k~cSAe*$i=LY9F2QMq=o!@AjSFY4;sPE}kz{{tlo{&@=X;hsIcv}Qfj<H5j!
zI0sLUjM32K)9d=i!R6hp;$_>iJ}Vq1-cevx7BLm8rB@a-Ct;IE<jMYgPNN%R40wI~
zQy-FT(yDlJa<tP);KkBQ1##ppI0lX4=adrd;lpOKLvVzBIGKy{Is57+h$K2};96_o
ziQ^r=z7C~9$ayO7Q8_#Y37o^bMUYKkU2Z(Wr&HBdjtbVeTG_@FR16rN_x4P)1Xc6h
zUJo?B#}8Yb2hnBa<r6L@M8<3ms{|#@biEC-_G{cs+^y^@{&DAcK@L}n(LIBXLAcp>
zH59Tn@it1VqD9umX|CghFqLAGjwyIXPPV=!K-uIikK@FjUi$R0vz9qcD@ciF)*lQ<
z6*&%d;+~nhB>BigH86wF3}MxWTPhi5@$+5TWmogdXU_I|e;hPS-LE*!#vjX>drfo7
zEv*bOS1E_*`G2~rObU=ru=WYUwcXYglG?gs01xirI@9S(i>N<{T(7oM%C;zs2Z7$t
zo?nHA3LOspb>HtedU=9vLOpiSJR?V*X^<x{q(B^*FBZ7WD*`L}^-~54*A~isDpg8=
z<8anAWLt&1T1WeSSVZNa+u%v_Fb;L%ctwq*_XF@rAzf_ed)<_1bE2;mgF?_XX4EJw
z%uZIf6O*D$xl01LmAlaM8=;CD@CGm;wFh9rlsRrjLLddaXm$W@n${ky{qd85Zj+J~
z9$9@alY%3sU1lOC8=WN4(w;59;o^dJWUihdtRD8yCwTX(alGamv_cwQZsntvP6U$f
zSd}azqDmh_DwCbubu|K%sUJ3u_^4UGUnUAZ(1slJ7Kc_4dD_)%5ZDoUwz_^1VSXg;
zCdu21QPo+SU_(Zx86kI=pxf>0ALZ`lpeLfXjBuYTwpyby-&}A<&nX_Ip1lrITWB$$
zKB5g7zB)RSH0gQkFPcO~X`-tjXrw{fqPk+TPt1c|tSyRyF7r7^ttk>(g`keey;*k=
z>X~?f24+`_+)S9HC<$GC9R%5BlmXk=RvlF6eXJi`XFbCAxZ_M9xQ(TPDE5b7szhX-
zxaaR7{lufQCU@gcoFfGKM`w6?g4nT614dB#z0@s-_FLXr(3!jSg#J#<q;6xs$F-?y
zGhQy|)Xb^gI#uWREh&sR7;mIO#cw!#q>vCvRzS!3jEPh?q@8Gct*cL@Hb?%F+)p2y
zeU^yxBayp!pK-^6l~BGf-)wm()K?mF+dRC}Y&v<Ma!Q{uoG$6xU!8>G4%JiZtSGCZ
zAD&~Oai%8O%KVQJykkvdj>K{7#Wq;Kt`Oo4NU<!ZW!d)A^ToOL3JSlklbUQSIltnQ
z>W<EI#Hj#ctvN&9mqt3Nu8!^s#=tN>TGs{Irf(9k(~n%cmkB4PW*Zf+58LUXP~>2(
z>uP#c4>CBtI1^Zah)`oLZG`G_OMQ6;QxDPBRjaG0r=O(kR^}y~Y^bc}p)M=rKrSV`
z#gm3{FUTVST|-+NBX9$@j{cF02B^xTDo?MFX#*;4%%>M4pz)uU4lI}8CFtE`GP@s=
zg0)|5*JvgaC%uHu<b2$WRO#lvzJy$0y|K^YmXRmDXGQV#uq&pttk=ji6|T!eW{NwB
z+z<qrXic!9ph=|u+vYu|MJ$V@B2r$Ky_~Ro<<Y$v7jf;Ky1#x30lM&<8K*dv+(=!B
zHDQNUi|l_b$eIq--v2tX!af%#3m1EdIu4Vt1pTbhQ8^WAC}8VZoNHa&#GM~2C2l>G
ztP)R8F(ikIGWy=wB)FZ^_`Q?Z)3_Oj&XrtJZDJlwbGR5)aeOs}y5cW#tGq|y-SS6r
zp<LN}luJWDiFrlSd8(Z{El6n~6J0`#p+s*Z){_RrJ?>vT#{Ryh%2&&n90U}qy_I?f
z%@==V-$_T<S>ReTxz#b8+2xEVJ61G@7sTnoC2de0;uH1$U?C6DoQLf>^V3fUBG)bu
zAU4J2j2b~a;+Ra6tuSYg+!!7NTcm<JMS8@Todh^)1tj#&vR9NhAa2W!Us+$^cg`j2
zt5l&7c^0}9hL}~oub36~Laou9B73z*5Eb3yqSIK(>a*hf(L%U0W#Q8G8Zn(Jnr%!Q
zxC0N^^PDGj$z|h2irOLJc!o5L%d_<w9tPg+k?OKcop%_DN|{6ZOvur@FI>`HcAE~q
z;qI9*b)-rVmA?(<*hUTPba4snL~mu`FJ??cqC2^av%c>~vWSTa%U6|$c3-v$SoNXK
z4y<zEJ;$aws`bp&*C#a(R7yNET5*2Xj}u9dTh!H`wi`O@z$<TZn$4o$QS}FF;D7t1
zQVx<B+K6$P%<&PL_3im%$o=E14cuZRwpC<v-n}VjNv<fu;#KgQ=1iV8DqqY{&&LZh
zt`va>5$WpeNJ+Zrbzk;np|u5S+j$pn1mkw;(Wb6JmdG8pcPG;84vc^Tkgw3(A)+yG
zEMBGDN~^tCd+63FIsq@J2fvZrfyWQ{=8!;)>n$e}@Q<pEL3E$UVE+*z#9UePuGxOm
zcB~A;L?d98Tx>VIq10BA#qe$no&W+lX3*TkHUqU`Nb5{lbIG!fKX@#h(W9puL3RnM
ztehfS`*vzw&b|6pe}x1^(aB)CXZ&BNy9WZ0iNZP3kq0X(1YBCDpGaaG`oT(TH{i>-
z?^+ZJ`!EP?Ct_BSBr@qV^brnyrS4TI!M{T=H;weOkmAj|DbV}6tXnz@p{8vMqGSX{
z;hEqhVCbDUZpt$~MOWiI5o2k|Fa&Z}Q<(iS$<{{$;PEazYbsjL+#j1X(sr|^7mi7)
zuf%HXqP<#dJ7M*)BM<h={rQ_3g_kl1D<cp=pkcfa86SLcBH8C5)VgEtWw8st%}?=1
zd^<+^IjgUvS$mgdVi|#Eq|s`^ym<qGF*Gt@STW&<%N1SGiqvq^=|z(#Gr?-{SrM1-
zs6$PBuM(Ga_=Mr_t85#}aIt{?8q;3!jxV>ATo7Kd$kC{U*AlQlh158f&T4zn_O9ks
zc$h~jWY=p~4vk|*@3NWAx?IkCjbB5UQnkn1{hg))R?hXJxVDNjG~6O+BDWqUiXdFX
z!VGQLMe=d*j&}x;$^)&;{h^h5*{aU-*gl>#tG$rnNS5295#Y3j(=*S&C8Aq`C1xzJ
z2K^EW;Is5HZuk`QauCVB{iIXu<ORNme(ib0txCir1M{Oh>~?W9Uu6Y?1-e3X(V;XW
zjhmf(&mxv1j-Rx@&^lx`;N$HLC)nM<O@&{pq*T?jIxs2^%`>=&g*fQ>$5!kyF+QO~
z8)*bg&-H^W9=gaEflyOt`|I7TbY|&g6^htLi&FKQfh0{QJK=>K(lzzPiVn_8#Tq1Y
zsx(mdna@jZYl8wZYgN^DD>^ucRK8dl6IP)$70j*Vxm?RtDiyA~B+m_nema+2T}2^5
z_BpjB7UX-S&2wBIHLuB^yen{(DvB)BXeYE<T*%BE+KIYKz6{+nW?ty%58m)(JXB8Q
zl20(L`0o6I_wLO&yzN~0IB)ooJEdbkA7k&ohe&=gH(G5kgcVSCwj?YsISH_K9C%a8
z8u}#WlDCV~6vTtz-l>Ok%=hieLz&;X{<d!b-t5C!vA#Q9?Etz#{SdT8&z#~ivA=7M
z68u)u_xj9ndEX)6ABN<c&fV@OPY}2txT~QO9w`;&Os~dZBsGYHm%s}04WY_bBs%J=
zf?I}|8L0;dw{H{N(Dj#)oKWbK?P}Uu1&y2UH(F2Iq7))rcC&iadfv`O3JRgu*nMwC
z^6#WtfH@l7<_dnKWo^MVK6jZzh;K*Ks0r6E@-O-2K>~d|+sWzM5he@7qMM{?(B`Ew
zf=|X)Y)!}HgU!|T?RTmm1Uomf58?dWJiL3ineEW#2AHoPXzKczrO|kpj5BRRJm!(|
zUvoPC%j^9trEy4>H&Hje&>fE6guB;PC(N48v=t%<s&~Cs)$!?<?Q8I*2*%7&Qat9#
zIw^QH?Ti>7l1fhs7uK2vXh^cdK%_5(RSSX8W+RJr<N6D{Z!Q?D<$=;GT89~;$%D|D
zvZS#^l;diWp7(|Mv9vS}K9@$*sbbH)5#_+-&U=;SnIP0Qj!F=F&n<sKsg&P6pFohz
zXskXWaCb`Y#fkU1swXArLKP%+&H}uq-!t^mho?LU0$XEdu<8}y%T+BGXqwNkfgK5r
zX)im-*_J50$0kxV7YxQ<v!b9>S%HF4rx<~SV+q8!L4r@09zBJ*9spHe)u{cbC2d%?
zh(a{v*Ar$-Cxktz+v=O%{5HX;r(sDL!$@<oj^ni3VVI0vw*q(PURa{K`cRBjH$fh+
z1%U27$N_TxZch37WJ*kntKEAp?BZwh=M-Mtf*S&D9IC&9oAY9ca7Pp5M0}pRP6#EH
z0^5_Oqt@FfWb;V`Q8*GvB8kACXk1bc01pgZtgb@Y+FDplg?DiqRMQuj98s%kd~Ycj
zth_)^tr7n!I4f$u!=|_b0U(@hC6!Ezn#xUj1XOw-_kIcjt4UCfI)NvH%FcKuSo>jH
zR!P=e!74`UwFIa8+#Y|<7=G-nWD2c4&U3XExkD2#6U^m!g-&{jA!0V;<oG@q9d0_b
zYfOJU<mmf#?P{d;v1?WEm8@q2twLP!xRJ`~*}SXemvo-lcs(-_>Q?dP!dY5dCmn|D
zYVGysnUlNQ8+lL_7hT@JAPRuWQ6Xf#SNSVDQU)bxf!W1574sF<JP~sk_7?6Z6}g#i
zEmPL2d;-(Fyq(AC<Z1VtouG|16?Q+9d9t5ZkOy$q<0+Yjkxpde@gBhTM4^|6Y2y%Y
z;dnXDgFJ7{92$K<U80clY;Flj9FjdTi1L>q*!Md>O65V+q@E<K2yoxL$52k*8M0Hw
z(?qM$zao-`IVeaKsxLHew;F%n$m;6q!eFWU-Rb-hooRH(Wd0n{7X#XvpTDS`8bx?p
z7|N&Cr+QD5G(XKLz_dNC+Bo`2jBmjud>f)huqWn2E1hNFH#7!fjX01UCX!E9i)=Vx
z8|m;x%e=P?euw3{9--R^{K+h8nt+{F2kf-$_ij*<yh@WfA8(dqmasA`H$`<|Rw&}-
zxiHrKDwOKX9|(i1?X8!g+eO?zCSx*R4uS~QS#xewFSm6<+b0w?nBg5rip(&M!4VKB
zZdOYx9z2xtSf)Y`-U;Mc&z|&FM~=$ev90@W^za_XJyY&iEw^e_xTYvh_o3--l)-X+
zA|cbpu4ztr2h^7`Plc=A4~nSlwqu0oCZb0Goi19a`cUOt6`r}BJLVWFXlM!+#&nsw
zc}-~Vj9d=W=MJyI$rHTbdN*5KfdUs3%n=nn(U1>e*!MYkj>tk+H!R6M4--D2etJsu
zD8FwihHrmG%H;Xkx>IOW`r++-8uXhF2RJk&9kg$U7yyrWQ=Z8LfOpA)YT4kVL33Jf
z_|gsv60VMZ&ZECuX!?x2iMI@db}BfsDo;|e>%tXD_Vy@5T!T?F!g5XoqK`D@XN9!y
zB<CmGBn`YY8TiGwG{4Pfl-)Z4o)+0YJaF7N-lif(U^3QyJ|{(;{NTW{_G92;8kSob
zw|pXIWmQ3Ui{!7~3CDH69G<(1+kA-^v20sLLu7Ge<Jy=F-aUCH-c_%}ZC~K4nMwIW
zXU;t+F*Vy8(@kVfM&GGo($HkAB89i{R+QTgp{r1=y$1R2o9S+aeHGn^#w$^a5;ihp
zy<^dF$#LGv47p6;SQbJC?0&$*r?Wc(=~0%OEw{MEN!%ul$WtM&u7CZ?z0<y|`!GD&
zpFyO0S!A6TgXmWD_r88{Rf5EE$CjpUG!=$Zl_~GtF%N}D%rhVr9oSUt#Yz<q!}fcr
z6Nfr$x|55>?-L&Au+Uz6rk3krk`=@{)de44Pb7fieHo?Cjd?fYrpEP$`t5qx@BQh^
z&otGOq{}WFccw}1`8eV`t#G1U-KR|Bl?iC7THdCT&MMT7bY>C)&nZ%)-&#g5VlQT@
zvKi(a>aYkRwi&gWgY>v93q*n($)l<+t!%u9UXVO{)BtIrM(ZSV7W|euUA)<q%RBx+
zyoG9dgMv+z_=WSb6H+_|qF#kIo%ivS<o6<zR`72TN76JfBMW8C`M6s}u|=d#_7V5d
zye*3Yev!TMrKC2TA#RK3$61=MWWm#;{V@3%b3gg{Wg|3aAMv_Gk$lNwgjK+ha>m-h
zeiZyPrF?Q5#k=#3HJ?kz@AdMP&&17bz+TbVk6hotnYZLNPEuHKSY<+U{yqxC6k_KV
zL;?|ECMPtzrsBz{*jA<fE^s~txt5{<Wcq-A`F@y6vhs~5PCYq2gsc67=A>g~TJe)1
z8eGrx$)R)Jp7nV>4npvJ$Sa>tzH<?5f+%NEhoo)IEmdXLL{B>S0D)Tj;g%A{nUKnT
zjoYz2276eDl~wasB9)V`uP;MFXDGBk+_ms23nY0qNVzYx)<yjppkD#H7#~xFIB6d3
z4jfIUKiIzX;TYpVIq}LX%>mL;PUx5F^BY^9Z&BL^z)irW4KpgS3Najb22$F+2YqU)
zI|J}DhDq@oxZApS`b=Y90B*3pvEsP3t9fkPs+YDpG!2`GtCrs0a0l>VVu}cQA+*eG
zn!5=f=%tXTMv@`mU#b%?=r-%_g!Wf@&Z#?z_XSj}{G%{HwcL!`I&<f)wf`;ZPAkZo
znCHVzsul7yMG8Z^k92s&PsSdhcQYoX>l#6%w#BW!&h(tnzz>b#TYARk2NOa7P0~x8
zpl<599`Z&BZ^w5DuzE^|uL$Xn_DRc8&9_B%bq5NMTAB2ur|3@?c}3275_>b~%?zAI
z_yIB4ynpi2=ChIVIrn0>r0<WOj6GU~n#)n0%a9{?xi^<kgFv^g)W{|S^Yc>C{zE0l
zla7>o-`Ph1fz8QJ%IAJff+Y%5tFVu!+j)(6_!05~k1CtMMznJ^M?mb+@boUtE0RLN
z{u4&{vM^TpmO?ydS*hclp`?&ej@ZfNg$`yaZd86TV&tP=e;&J;%uGSRPC3qm-ws8~
z`IxZc^HU=<)sbChuQntZ_h}>*6EE}o0?w+09wj<&q;YqD#|ul7_>7cmJ)m>&^>t^L
z3D1Ch^6nJ=z{kJz(I&ZPjZ}7+aF>-%Z0bf~%6I=fO|Jc<Am)<1^8-Au0e2k`up=UV
zhQiYq(N!oOhh-IpV=<SA9g)0lxQ8_jlgF(98YcZCdXh%rCyu1EXC&0D+)DG436ai`
z^zMuE0=AZm5(X(E{jm0MYs&l3!pi3(z;~W<CcVlkV?^s9&;B}=b8lJy-DceKY}bno
z>`}U1<l`@Da!)C0uWcq8xMPlzl)c$GlF{8!3EbMYc0i4S^`%~bTC95dK{~cZgCD1?
zWP*h>&1|p8`4^ML@)oVcvC?bx=X~Y|)dM#W#(k*>pCX8vU!3(PW_y8Aj<FuZu7?lY
zyk5hrm?_d_Pv0b6J!e=a<XP-Zc;$G^tU!?A+UDdrGp2=Q4&_C;*Ub<jpi;tq_AT1I
zZx<sP-K$ZOJcwn%21Zq&adPR@VRKv0d$?S#0YB^31^*#&^ZMf=Y(a~y3uQR&k`-1A
zTLpH1VXRe!B3?n4N85%TeY<YD7;gK;tY%0*)7s_j+`a?L_C}1e)b8Bgg%>74iCQ}j
z{4U}!q4WYACX6JLMp79?`6)+|;e8Jjo0yE!E$TxkB<7eDt1+fOz73qTlz)1@VK?WG
zk;Qi5-zpoxcW}9;`||uK8zUL1H%!&alQ0TG%Jdl?R1ca9yZMva>p<c9Qyrsi)`^ol
zf1Z<`9zxYi_URP#WdWtgNZ;;v7C{s9uf^0)())5~?ux^&Uk-(_9C$Ya+`0&K!(Zq0
z<!&Cd8{Q(sFEr;<`n{Ud_d%Ir>dSBVRaDGH%#%;Jo@Nbh)D9w{P0<ks3GC6xo!uTi
zM*9zPZqsigCUc9oayg}R`DYB+lrrVXdzD?~G<WRiBh!%b*40Hl$lCfvDytt->oB*x
zWplli?;?>~w}MsY-+zDl4AVzt{0~yonXNMu^7x5V>BHO2xhKa=%U2_q+D!WB^?F$7
zC*Om@xzjG1sAM#AC|7v9=xJw-fjfA%;#kbo0`bE<y(lJ<_PpJM5qhAU&N_~TY<CsG
zJw;qwiVRJ8oRz|<M@^OfvedsxMZ6Eh{h5NiwY<U<sWYia-;gIvVw7raVTA6#O`c+f
zBvGPGGLYjGFM_a-<ZLGM<%7!KaILCE=gat(D=B?B8PDjUscgPO)umO6f6*w%U&?6p
z%d>92ng(CAV{$(!F6W9r5+4gAb+s-A_CDLP@fvS{-CHT(aMt{m&3pZWf-JjA{kR3?
z(&LR88g28sY)AjlxP}!X5)X176kK%I)n(2V`9Y_;3RZ?T?y{i;t%@|h-v`V;V)-#2
zFL06cMld@g6&`v=Lx<r#pw{8&(k%gBjvrVdCP(K14=L^c#qs3)UMw%9h_cT=S!!bm
z1?=MAi11}#o$On%3HbXs^relZsiDvhdRnArll@|$vt~>P=c$1Um&E(WHj(Kw_zxRY
zk*CRLksco`#6p_qh#+S|tPH)odD*I;Pi-ZZn|Dose(R?Sul6}lmO?0VBWvJ}xAxlz
znI2q}#K7%T=_Egu^5}BK;Ij4oQL*pU)eizQ!M2&1_2^u|r7kSCsY$BC?kBQ&Zde#7
z%m20xCpU#EXI=D3@MXUWq9N>2g_z47OI<heb)J%&g?@PgbKaB~ua1M5H*a24<zSXg
zeY(I`!Ya8{6lLDAS5KEr4cX$kVh=wi4zM3gb219$-ED+yP>_J7vaY$9tI*!QHUk6X
zipgkZYK355N#7*-ZUhSt+RmGYVy2^nRE9CZrIh`{=_*q`@vJh#zET%o+$DmeuNrTm
zPZ1Jfi_j0<v<;l_6}IO!IGFsWFxIH;GfDw2ee@%h$<lPCB&|%y3{J&6)eb!1w;>Bn
zSwRI=sL-#RHvYHsQWgt59h$34I@8JkCj#8XrjdC@ms7dg+OKH0Fj0{0X+{WhVOu}3
zIzs55JIHj$nEdsWy2gljq6#!S_Xya6Hf*U;+9Drqn+$8LBJjC-yoTgS!!#xvNL#`1
z^TZ@hWo&-#>WVkPXP~|ITy24Qq}mw$3=ZP)8ig^A^%8m!LkUKcrSN)^<`1a|hc#R6
zHpKB_XfNaokNL*JfBw+AN9^^<BVylovZb#hNyl510@7avmal($ti7fYfb?80=zIa&
zU-=k*x@Wj|-Pzwobin<kNPhi&Ne3USud3*t7mvOmo^KkHD7D_mENnC42d&(-4k-@j
zo!R$I@4mD{(QLhurv3@+AGGrDx<^URGU%^>@J(avv)3D$z9PpA|K<;0%C36rM;u~`
zw*0lMzG+Ou<@H7y&f2U9e)ESft&Cnb1xh&cHhn$7e+|Xstk0IeKFkd0OW69RF^AVL
z{V?j>ANzx$HeHti{_leLKV?C<E&&JE1b(m{?rQ4rctg_9pe(wHu^pZ>r@y}_4&K$2
z1rAnQ9$@{ol)nARzVfFk$hbzxz{c-K3C$Przyq>7zBVX*v)L8FcLza>B3g4Be$a$9
zC9#x$tHzhz@=q%~QC@RCX*E)m_RYtB6(usoHG#{-f<(Uh)t7w({O(?hz(IN|tNyY7
zw>|soeO<tvJ9)KLeE;;~KmV&a4%90gId%<dUw`b^`}EefovfbWZ_I69H|F3Xu(ghJ
z6-I^sdgr%46$1gn<@Wp!zQ66@<5ggHCvt!H<oo(#zZ#EwmcRqWr|28LZq--MHUt2(
s+=BeIeCwZ``X)B~|6>^payKkNVNLmP-5B6*^Plw28EfaCy%zZY0Bl0zYXATM

literal 0
HcmV?d00001

diff --git a/docs/skills.md b/docs/skills.md
new file mode 100644
index 00000000..16045860
--- /dev/null
+++ b/docs/skills.md
@@ -0,0 +1,649 @@
+# Skill Deep Dives
+
+Detailed guides for every gstack skill — philosophy, workflow, and examples.
+
+| Skill | Your specialist | What they do |
+|-------|----------------|--------------|
+| [`/plan-ceo-review`](#plan-ceo-review) | **CEO / Founder** | Rethink the problem. Find the 10-star product hiding inside the request. Four modes: Expansion, Selective Expansion, Hold Scope, Reduction. |
+| [`/plan-eng-review`](#plan-eng-review) | **Eng Manager** | Lock in architecture, data flow, diagrams, edge cases, and tests. Forces hidden assumptions into the open. |
+| [`/plan-design-review`](#plan-design-review) | **Senior Designer** | 80-item design audit with letter grades. AI Slop detection. Infers your design system. Report only — never touches code. |
+| [`/design-consultation`](#design-consultation) | **Design Partner** | Build a complete design system from scratch. Knows the landscape, proposes creative risks, generates realistic product mockups. Design at the heart of all other phases. |
+| [`/review`](#review) | **Staff Engineer** | Find the bugs that pass CI but blow up in production. Auto-fixes the obvious ones. Flags completeness gaps. |
+| [`/ship`](#ship) | **Release Engineer** | Sync with the base branch, run tests, audit coverage, push, open PR. Bootstraps test frameworks if you don't have one. One command. |
+| [`/browse`](#browse) | **QA Engineer** | Give the agent eyes. Real Chromium browser, real clicks, real screenshots. ~100ms per command. |
+| [`/qa`](#qa) | **QA Lead** | Test your app, find bugs, fix them with atomic commits, re-verify. Auto-generates regression tests for every fix. |
+| [`/qa-only`](#qa) | **QA Reporter** | Same methodology as /qa but report only. Use when you want a pure bug report without code changes. |
+| [`/qa-design-review`](#qa-design-review) | **Designer Who Codes** | Same audit as /plan-design-review, then fixes what it finds. Atomic commits, before/after screenshots. |
+| [`/setup-browser-cookies`](#setup-browser-cookies) | **Session Manager** | Import cookies from your real browser (Chrome, Arc, Brave, Edge) into the headless session. Test authenticated pages. |
+| [`/retro`](#retro) | **Eng Manager** | Team-aware weekly retro. Per-person breakdowns, shipping streaks, test health trends, growth opportunities. |
+| [`/document-release`](#document-release) | **Technical Writer** | Update all project docs to match what you just shipped. Catches stale READMEs automatically. |
+
+---
+
+## `/plan-ceo-review`
+
+This is my **founder mode**.
+
+This is where I want the model to think with taste, ambition, user empathy, and a long time horizon. I do not want it taking the request literally. I want it asking a more important question first:
+
+**What is this product actually for?**
+
+I think of this as **Brian Chesky mode**.
+
+The point is not to implement the obvious ticket. The point is to rethink the problem from the user's point of view and find the version that feels inevitable, delightful, and maybe even a little magical.
+
+### Example
+
+Say I am building a Craigslist-style listing app and I say:
+
+> "Let sellers upload a photo for their item."
+
+A weak assistant will add a file picker and save an image.
+
+That is not the real product.
+
+In `/plan-ceo-review`, I want the model to ask whether "photo upload" is even the feature. Maybe the real feature is helping someone create a listing that actually sells.
+
+If that is the real job, the whole plan changes.
+
+Now the model should ask:
+
+* Can we identify the product from the photo?
+* Can we infer the SKU or model number?
+* Can we search the web and draft the title and description automatically?
+* Can we pull specs, category, and pricing comps?
+* Can we suggest which photo will convert best as the hero image?
+* Can we detect when the uploaded photo is ugly, dark, cluttered, or low-trust?
+* Can we make the experience feel premium instead of like a dead form from 2007?
+
+That is what `/plan-ceo-review` does for me.
+
+It does not just ask, "how do I add this feature?"
+It asks, **"what is the 10-star product hiding inside this request?"**
+
+### Four modes
+
+- **SCOPE EXPANSION** — dream big. The agent proposes the ambitious version. Every expansion is presented as an individual decision you opt into. Recommends enthusiastically.
+- **SELECTIVE EXPANSION** — hold your current scope as the baseline, but see what else is possible. The agent surfaces opportunities one by one with neutral recommendations — you cherry-pick the ones worth doing.
+- **HOLD SCOPE** — maximum rigor on the existing plan. No expansions surfaced.
+- **SCOPE REDUCTION** — find the minimum viable version. Cut everything else.
+
+Visions and decisions are persisted to `~/.gstack/projects/` so they survive beyond the conversation. Exceptional visions can be promoted to `docs/designs/` in your repo for the team.
+
+---
+
+## `/plan-eng-review`
+
+This is my **eng manager mode**.
+
+Once the product direction is right, I want a different kind of intelligence entirely. I do not want more sprawling ideation. I do not want more "wouldn't it be cool if." I want the model to become my best technical lead.
+
+This mode should nail:
+
+* architecture
+* system boundaries
+* data flow
+* state transitions
+* failure modes
+* edge cases
+* trust boundaries
+* test coverage
+
+And one surprisingly big unlock for me: **diagrams**.
+
+LLMs get way more complete when you force them to draw the system. Sequence diagrams, state diagrams, component diagrams, data-flow diagrams, even test matrices. Diagrams force hidden assumptions into the open. They make hand-wavy planning much harder.
+
+So `/plan-eng-review` is where I want the model to build the technical spine that can carry the product vision.
+
+### Example
+
+Take the same listing app example.
+
+Let's say `/plan-ceo-review` already did its job. We decided the real feature is not just photo upload. It is a smart listing flow that:
+
+* uploads photos
+* identifies the product
+* enriches the listing from the web
+* drafts a strong title and description
+* suggests the best hero image
+
+Now `/plan-eng-review` takes over.
+
+Now I want the model to answer questions like:
+
+* What is the architecture for upload, classification, enrichment, and draft generation?
+* Which steps happen synchronously, and which go to background jobs?
+* Where are the boundaries between app server, object storage, vision model, search/enrichment APIs, and the listing database?
+* What happens if upload succeeds but enrichment fails?
+* What happens if product identification is low-confidence?
+* How do retries work?
+* How do we prevent duplicate jobs?
+* What gets persisted when, and what can be safely recomputed?
+
+And this is where I want diagrams — architecture diagrams, state models, data-flow diagrams, test matrices. As noted above, they force hidden assumptions into the open and make hand-wavy planning much harder.
+
+That is `/plan-eng-review`.
+
+Not "make the idea smaller."
+**Make the idea buildable.**
+
+### Review Readiness Dashboard
+
+Every review (CEO, Eng, Design) logs its result. At the end of each review, you see a dashboard:
+
+```
++====================================================================+
+|                    REVIEW READINESS DASHBOARD                       |
++====================================================================+
+| Review          | Runs | Last Run            | Status    | Required |
+|-----------------|------|---------------------|-----------|----------|
+| Eng Review      |  1   | 2026-03-16 15:00    | CLEAR     | YES      |
+| CEO Review      |  1   | 2026-03-16 14:30    | CLEAR     | no       |
+| Design Review   |  0   | —                   | —         | no       |
++--------------------------------------------------------------------+
+| VERDICT: CLEARED — Eng Review passed                                |
++====================================================================+
+```
+
+Eng Review is the only required gate (disable with `gstack-config set skip_eng_review true`). CEO and Design are informational — recommended for product and UI changes respectively.
+
+### Plan-to-QA flow
+
+When `/plan-eng-review` finishes the test review section, it writes a test plan artifact to `~/.gstack/projects/`. When you later run `/qa`, it picks up that test plan automatically — your engineering review feeds directly into QA testing with no manual copy-paste.
+
+---
+
+## `/plan-design-review`
+
+This is my **senior designer mode**.
+
+Most developers cannot tell whether their site looks AI-generated. I could not, until I started paying attention. There is a growing class of sites that are functional but soulless — they work fine but scream "an AI built this and nobody with taste looked at it." Purple gradients, 3-column icon grids, uniform bubbly border-radius on everything, centered text on every section, decorative blobs floating in the background. The ChatGPT aesthetic.
+
+`/plan-design-review` gives the agent a designer's eye.
+
+It opens your site and reacts to it the way a Stripe or Linear designer would — immediately, viscerally, with opinions. The first output is a structured gut reaction: what the site communicates at a glance, what the eye is drawn to, and a one-word verdict. That is the most valuable part. Everything after is supporting evidence.
+
+Then it extracts your actual design system by reading the CSS: how many fonts are you really using? What is your heading scale? How many colors? Is your spacing on a grid or arbitrary? It structures this as an **Inferred Design System** and offers to save it as a `DESIGN.md` — so now you have a design system you never had before, derived from what you actually shipped.
+
+The audit covers 80 items across 10 categories. Typography, spacing, hierarchy, color, responsive design, interaction states, motion, content quality, performance feel, and — the headline feature — **AI Slop Detection**. Ten specific anti-patterns that mark a site as machine-generated.
+
+Every category gets a letter grade (A through F). The report opens with two headline scores: **Design Score** and **AI Slop Score**. "Your site got a B on design but a D on AI Slop" tells you exactly where to focus.
+
+### Example
+
+```
+You:   /plan-design-review https://myapp.com
+
+Claude: Design Score: C  |  AI Slop Score: D
+
+        "The site communicates generic SaaS energy."
+        "I notice the hero section uses a blue-to-purple gradient
+         with a 3-column feature grid below it — the single most
+         recognizable AI-generated layout pattern."
+        "The first 3 things my eye goes to are: the gradient, the
+         symmetrical icon grid, and a 'Get Started' button that
+         looks like every other 'Get Started' button."
+        "If I had to describe this in one word: template."
+
+        Inferred Design System:
+        - Fonts: Inter (body), Inter (headings) — 1 font family
+        - Colors: 14 unique non-gray colors (flag: >12)
+        - Heading scale: 36/24/18/16 — flat, no drama between sizes
+        - Spacing: mostly 16px and 24px — no rhythm
+
+        Top 5 Design Improvements:
+        1. Break the 3-column icon grid (High, AI Slop)
+        2. Add heading scale contrast — at least 2:1 ratio (High, Typography)
+        3. Replace uniform border-radius with intentional hierarchy (Medium, Spacing)
+        4. Kill the gradient hero — use a real image or bold typography (High, AI Slop)
+        5. Add a second font for headings — Inter-only reads as generic (Medium, Typography)
+
+        [Full report saved to .gstack/design-reports/]
+        Want me to save this inferred design system as your DESIGN.md?
+```
+
+This is report-only — it never touches your code. Use `/qa-design-review` when you want it to fix what it finds.
+
+---
+
+## `/design-consultation`
+
+This is my **design partner mode**.
+
+`/plan-design-review` audits a site that already exists. `/design-consultation` is for when you have nothing yet — no design system, no font choices, no color palette. You are starting from zero and you want a senior designer to sit down with you and build the whole visual identity together.
+
+It is a conversation, not a form. The agent asks about your product, your users, and your audience. It thinks about what your product needs to communicate — trust, speed, craft, warmth, whatever fits — and works backward from that to concrete choices. Then it proposes a complete, coherent design system: aesthetic direction, typography (3+ fonts with specific roles), color palette with hex values, spacing scale, layout approach, and motion strategy. Every recommendation comes with a rationale. Every choice reinforces every other choice.
+
+But coherence is table stakes. Every dev tool dashboard looks the same — clean sans-serif, muted grays, a blue accent. They are all coherent. They are all forgettable. The difference between a product that looks "nice" and one that people actually recognize is the **deliberate creative risks**: the unexpected serif for headings, the bold accent nobody else in your category uses, the tighter spacing that makes your data feel authoritative instead of airy.
+
+That is what `/design-consultation` is really about. It does not just propose a safe system. It proposes safe choices AND risks — and tells you which is which. "Here are the choices that keep you literate in your category. And here is where I think you should break from convention, and why." You pick which risks to take. The agent checks that the whole system still coheres either way.
+
+If you want, the agent will research what's already out there in your space — take screenshots of real sites, analyze their fonts and colors and spacing — so you can see the landscape before you make choices. This is not about copying. It is about getting in the ballpark so you know what the conventions are, and then deciding which ones are worth breaking.
+
+After you agree on the system, it generates an interactive HTML preview page — not just swatches and font samples, but realistic product pages. If you are building a dashboard, you see a dashboard with a sidebar, data tables, and stat cards. If you are building a marketing site, you see a hero section with real copy and a CTA. Everything rendered in your design system, with your product name, in light and dark mode. You see what your product could feel like before a single line of production code is written.
+
+Then it writes `DESIGN.md` to your repo root — your project's design source of truth — and updates `CLAUDE.md` so every future Claude Code session respects the system. From that point on, `/qa-design-review` can audit against it, and any agent working on your frontend knows the rules.
+
+### Example
+
+```
+You:   /design-consultation
+
+Claude: From the README, this looks like a developer analytics dashboard
+        for engineering teams. Sound right? Tell me about the feeling
+        you want — and would you like me to look at what's out there
+        first so we can see the landscape?
+
+You:    Yes, it's for eng managers. Show me what's out there.
+
+Claude: [browses Linear, Vercel, Datadog, Posthog — takes screenshots]
+
+        Here's the landscape. They all converge on clean sans-serifs
+        and muted blue-gray palettes. Linear stands out with dark-first
+        and tight spacing. The rest feel interchangeable.
+
+        Here's my proposal — and where I'd play it safe vs. take risks:
+
+        AESTHETIC: Industrial/Utilitarian — data-first, every pixel earns its place
+        TYPOGRAPHY: Geist (body + UI), Instrument Serif (display), JetBrains Mono (data)
+        COLOR: Restrained — slate neutrals, single teal accent (#0D9488)
+        SPACING: 4px base, compact density
+        LAYOUT: Grid-disciplined, 12-column
+        MOTION: Minimal-functional — only transitions that aid comprehension
+
+        SAFE CHOICES (match category expectations):
+          Geist for body — your users already know this font from Vercel
+          Slate neutrals — cool grays feel right for data-heavy UIs
+          Grid-disciplined layout — dashboards need predictable alignment
+
+        RISKS (where you'd stand out):
+          Instrument Serif for display headings — nobody in dev tools
+            uses a serif. It creates instant hierarchy contrast and
+            signals "we care about craft" in a space full of sans-serifs.
+          Single teal accent instead of blue — everyone else in this space uses blue.
+            Teal is close enough to feel trustworthy, different enough
+            to be recognizable.
+          4px compact density — tighter than Linear, says "we respect
+            your screen real estate."
+
+        The safe choices keep you literate. The risks are where your
+        product gets its own face. Which risks appeal to you?
+
+You:    Love the serif risk. Let's see it.
+
+Claude: Preview opened in your browser.
+        [/tmp/design-consultation-preview-1710000000.html]
+
+        The page shows a realistic dashboard: sidebar nav, header with
+        avatar, stat cards, data table — all in your design system.
+        Instrument Serif at hero scale, Geist in body text, JetBrains
+        Mono in the data table. Teal accent on buttons and active states.
+        Light and dark mode toggle in the corner.
+
+        How does it feel? Want to adjust anything before I write DESIGN.md?
+
+You:    Ship it.
+
+Claude: Wrote DESIGN.md (typography, color, spacing, layout, motion).
+        Updated CLAUDE.md with design system guidelines.
+        All future sessions will respect these choices.
+```
+
+---
+
+## `/qa-design-review`
+
+This is my **designer who codes mode**.
+
+`/plan-design-review` tells you what is wrong. `/qa-design-review` fixes it.
+
+It runs the same 80-item audit, then enters a fix loop: for each design finding, it locates the source file, makes the minimal CSS/styling change, commits with `style(design): FINDING-NNN`, re-navigates to verify, and takes before/after screenshots. One commit per fix, fully bisectable.
+
+The self-regulation heuristic is tuned for design work — CSS-only changes get a free pass (they are inherently safe and reversible), but changes to component JSX/TSX files count against the risk budget. Hard cap at 30 fixes. If the risk score exceeds 20%, it stops and asks.
+
+### Example
+
+```
+You:   /qa-design-review https://myapp.com
+
+Claude: [Runs full design audit — same output as /plan-design-review]
+        Design Score: C  |  AI Slop Score: D
+        12 findings (4 high, 5 medium, 3 polish)
+
+        Fixing 9 design issues...
+
+        style(design): FINDING-001 — replace 3-column icon grid with asymmetric layout
+        style(design): FINDING-002 — add heading scale 48/32/24/18/16
+        style(design): FINDING-003 — remove gradient hero, use bold typography
+        style(design): FINDING-004 — add second font for headings
+        style(design): FINDING-005 — vary border-radius by element role
+        style(design): FINDING-006 — left-align body text, reserve center for headings
+        style(design): FINDING-007 — add hover/focus states to all interactive elements
+        style(design): FINDING-008 — add prefers-reduced-motion media query
+        style(design): FINDING-009 — set max content width to 680px for body text
+
+        Final audit:
+        Design Score: C → B+  |  AI Slop Score: D → A
+        9 fixes applied (8 verified, 1 best-effort). 3 deferred.
+
+        [Report with before/after screenshots saved to .gstack/design-reports/]
+```
+
+Nine commits, each touching one concern. The AI Slop score went from D to A because the three most recognizable patterns (gradient hero, 3-column grid, uniform radius) are gone.
+
+---
+
+## `/review`
+
+This is my **paranoid staff engineer mode**.
+
+Passing tests do not mean the branch is safe.
+
+`/review` exists because there is a whole class of bugs that can survive CI and still punch you in the face in production. This mode is not about dreaming bigger. It is not about making the plan prettier. It is about asking:
+
+**What can still break?**
+
+This is a structural audit, not a style nitpick pass. I want the model to look for things like:
+
+* N+1 queries
+* stale reads
+* race conditions
+* bad trust boundaries
+* missing indexes
+* escaping bugs
+* broken invariants
+* bad retry logic
+* tests that pass while missing the real failure mode
+* forgotten enum handlers — add a new status or type constant, and `/review` traces it through every switch statement and allowlist in your codebase, not just the files you changed
+
+### Fix-First
+
+Findings get acted on, not just listed. Obvious mechanical fixes (dead code, stale comments, N+1 queries) are applied automatically — you see `[AUTO-FIXED] file:line Problem → what was done` for each one. Genuinely ambiguous issues (security, race conditions, design decisions) get surfaced for your call.
+
+### Completeness gaps
+
+`/review` now flags shortcut implementations where the complete version costs less than 30 minutes of Claude Code (CC) time. If you chose the 80% solution and the 100% solution is a lake, not an ocean, the review will call it out.
+
+### Example
+
+Suppose the smart listing flow is implemented and the tests are green.
+
+`/review` should still ask:
+
+* Did I introduce an N+1 query when rendering listing photos or draft suggestions?
+* Am I trusting client-provided file metadata instead of validating the actual file?
+* Can two tabs race and overwrite cover-photo selection or item details?
+* Do failed uploads leave orphaned files in storage forever?
+* Can the "exactly one hero image" rule break under concurrency?
+* If enrichment APIs partially fail, do I degrade gracefully or save garbage?
+* Did I accidentally create a prompt injection or trust-boundary problem by pulling web data into draft generation?
+
+That is the point of `/review`.
+
+I do not want flattery here.
+I want the model imagining the production incident before it happens.
+
+---
+
+## `/ship`
+
+This is my **release machine mode**.
+
+Once I have decided what to build, nailed the technical plan, and run a serious review, I do not want more talking. I want execution.
+
+`/ship` is for the final mile. It is for a ready branch, not for deciding what to build.
+
+This is where the model should stop behaving like a brainstorm partner and start behaving like a disciplined release engineer: sync with the base branch, run the right tests, make sure the branch state is sane, update changelog or versioning if the repo expects it, push, and create or update the PR.
+
+### Test bootstrap
+
+If your project doesn't have a test framework, `/ship` sets one up — detects your runtime, researches the best framework, installs it, writes 3-5 real tests for your actual code, sets up CI/CD (GitHub Actions), and creates TESTING.md. 100% test coverage is the goal — tests make vibe coding safe instead of yolo coding.
+
+### Coverage audit
+
+Every `/ship` run builds a code path map from your diff, searches for corresponding tests, and produces an ASCII coverage diagram with quality stars. Gaps get tests auto-generated. Your PR body shows the coverage: `Tests: 42 → 47 (+5 new)`.
+
+### Review gate
+
+`/ship` checks the [Review Readiness Dashboard](#review-readiness-dashboard) before creating the PR. If the Eng Review is missing, it asks — but won't block you. Decisions are saved per-branch so you're never re-asked.
+
+A lot of branches die when the interesting work is done and only the boring release work is left. Humans procrastinate that part. AI should not.
+
+---
+
+## `/browse`
+
+This is my **QA engineer mode**.
+
+`/browse` is the skill that closes the loop. Before it, the agent could think and code but was still half blind. It had to guess about UI state, auth flows, redirects, console errors, empty states, and broken layouts. Now it can just go look.
+
+It is a compiled binary that talks to a persistent Chromium daemon — built on [Playwright](https://playwright.dev/) by Microsoft. First call starts the browser (~3s). Every call after that: ~100-200ms. The browser stays running between commands, so cookies, tabs, and localStorage carry over.
+
+### Example
+
+```
+You:   /browse staging.myapp.com — log in, test the signup flow, and check
+       every page I changed in this branch
+
+Claude: [18 tool calls, ~60 seconds]
+
+        > browse goto https://staging.myapp.com/signup
+        > browse snapshot -i
+        > browse fill @e2 "test@example.com"
+        > browse fill @e3 "password123"
+        > browse click @e5                    (Submit)
+        > browse screenshot /tmp/signup.png
+        > Read /tmp/signup.png
+
+        Signup works. Redirected to onboarding. Now checking changed pages.
+
+        > browse goto https://staging.myapp.com/dashboard
+        > browse screenshot /tmp/dashboard.png
+        > Read /tmp/dashboard.png
+        > browse console
+
+        Dashboard loads. No console errors. Charts render with sample data.
+
+        All 4 pages load correctly. No console errors. No broken layouts.
+        Signup → onboarding → dashboard flow works end to end.
+```
+
+18 tool calls, about a minute. Full QA pass. No browser opened.
+
+**Security note:** `/browse` runs a persistent Chromium session. Cookies, localStorage, and session state carry over between commands. Do not use it against sensitive production environments unless you intend to — it is a real browser with real state. The session auto-shuts down after 30 minutes of idle time.
+
+For the full command reference, see [BROWSER.md](../BROWSER.md).
+
+---
+
+## `/qa`
+
+This is my **QA lead mode**.
+
+`/browse` gives the agent eyes. `/qa` gives it a testing methodology.
+
+The most common use case: you're on a feature branch, you just finished coding, and you want to verify everything works. Just say `/qa` — it reads your git diff, identifies which pages and routes your changes affect, spins up the browser, and tests each one. No URL required. No manual test plan.
+
+Four modes:
+
+- **Diff-aware** (automatic on feature branches) — reads the git diff against the base branch, identifies affected pages, tests them specifically
+- **Full** — systematic exploration of the entire app. 5-15 minutes. Documents 5-10 well-evidenced issues.
+- **Quick** (`--quick`) — 30-second smoke test. Homepage + top 5 nav targets.
+- **Regression** (`--regression baseline.json`) — run full mode, then diff against a previous baseline.
+
+### Automatic regression tests
+
+When `/qa` fixes a bug and verifies it, it automatically generates a regression test that catches the exact scenario that broke. Tests include full attribution tracing back to the QA report.
+
+### Example
+
+```
+You:   /qa https://staging.myapp.com
+
+Claude: [Explores 12 pages, fills 3 forms, tests 2 flows]
+
+        QA Report: staging.myapp.com — Health Score: 72/100
+
+        Top 3 Issues:
+        1. CRITICAL: Checkout form submits with empty required fields
+        2. HIGH: Mobile nav menu doesn't close after selecting an item
+        3. MEDIUM: Dashboard chart overlaps sidebar below 1024px
+
+        [Full report with screenshots saved to .gstack/qa-reports/]
+```
+
+**Testing authenticated pages:** Use `/setup-browser-cookies` first to import your real browser sessions, then `/qa` can test pages behind login.
+
+---
+
+## `/setup-browser-cookies`
+
+This is my **session manager mode**.
+
+Before `/qa` or `/browse` can test authenticated pages, they need cookies. Instead of manually logging in through the headless browser every time, `/setup-browser-cookies` imports your real sessions directly from your daily browser.
+
+It auto-detects installed Chromium-based browsers (Comet, Chrome, Arc, Brave, Edge), decrypts cookies via the macOS Keychain, and loads them into the Playwright session. An interactive picker UI lets you choose exactly which domains to import — no cookie values are ever displayed.
+
+```
+You:   /setup-browser-cookies
+
+Claude: Cookie picker opened in your browser — select the domains you
+        want to import, then tell me when you're done.
+
+        [You pick github.com, myapp.com in the browser UI]
+
+You:    done
+
+Claude: Imported 2 domains (47 cookies). Session is ready.
+```
+
+Or skip the UI entirely:
+
+```
+You:   /setup-browser-cookies github.com
+
+Claude: Imported 12 cookies for github.com from Comet.
+```
+
+---
+
+## `/retro`
+
+This is my **engineering manager mode**.
+
+At the end of the week I want to know what actually happened. Not vibes — data. `/retro` analyzes commit history, work patterns, and shipping velocity and writes a candid retrospective.
+
+It is team-aware. It identifies who is running the command, gives you the deepest treatment on your own work, then breaks down every contributor with specific praise and growth opportunities. It computes metrics like commits, LOC, test ratio, PR sizes, and fix ratio. It detects coding sessions from commit timestamps, finds hotspot files, tracks shipping streaks, and identifies the biggest ship of the week.
+
+It also tracks test health: total test files, tests added this period, regression test commits, and trend deltas. If test ratio drops below 20%, it flags it as a growth area.
+
+### Example
+
+```
+You:   /retro
+
+Claude: Week of Mar 1: 47 commits (3 contributors), 3.2k LOC, 38% tests, 12 PRs, peak: 10pm | Streak: 47d
+
+        ## Your Week
+        32 commits, +2.4k LOC, 41% tests. Peak hours: 9-11pm.
+        Biggest ship: cookie import system (browser decryption + picker UI).
+        What you did well: shipped a complete feature with encryption, UI, and
+        18 unit tests in one focused push...
+
+        ## Team Breakdown
+
+        ### Alice
+        12 commits focused on app/services/. Every PR under 200 LOC — disciplined.
+        Opportunity: test ratio at 12% — worth investing before payment gets more complex.
+
+        ### Bob
+        3 commits — fixed the N+1 query on dashboard. Small but high-impact.
+        Opportunity: only 1 active day this week — check if blocked on anything.
+
+        [Top 3 team wins, 3 things to improve, 3 habits for next week]
+```
+
+It saves a JSON snapshot to `.context/retros/` so the next run can show trends.
+
+---
+
+## `/document-release`
+
+This is my **technical writer mode**.
+
+After `/ship` creates the PR but before it merges, `/document-release` reads every documentation file in the project and cross-references it against the diff. It updates file paths, command lists, project structure trees, and anything else that drifted. Risky or subjective changes get surfaced as questions — everything else is handled automatically.
+
+```
+You:   /document-release
+
+Claude: Analyzing 21 files changed across 3 commits. Found 8 documentation files.
+
+        README.md: updated skill count from 9 to 10, added new skill to table
+        CLAUDE.md: added new directory to project structure
+        CONTRIBUTING.md: current — no changes needed
+        TODOS.md: marked 2 items complete, added 1 new item
+
+        All docs updated and committed. PR body updated with doc diff.
+```
+
+It also polishes CHANGELOG voice (without ever overwriting entries), cleans up completed TODOS, checks cross-doc consistency, and asks about VERSION bumps only when appropriate.
+
+---
+
+## Greptile integration
+
+[Greptile](https://greptile.com) is a YC company that reviews your PRs automatically. It catches real bugs — race conditions, security issues, things that pass CI and blow up in production. It has genuinely saved my ass more than once. I love these guys.
+
+### Setup
+
+Install Greptile on your GitHub repo at [greptile.com](https://greptile.com) — it takes about 30 seconds. Once it's reviewing your PRs, gstack picks up its comments automatically. No additional configuration.
+
+### How it works
+
+The problem with any automated reviewer is triage. Greptile is good, but not every comment is a real issue. Some are false positives. Some flag things you already fixed three commits ago. Without a triage layer, the comments pile up and you start ignoring them — which defeats the purpose.
+
+gstack solves this. `/review` and `/ship` are now Greptile-aware. They read Greptile's comments, classify each one, and take action:
+
+- **Valid issues** get added to the critical findings and fixed before shipping
+- **Already-fixed issues** get an auto-reply acknowledging the catch
+- **False positives** get pushed back — you confirm, and a reply goes out explaining why it's wrong
+
+The result is a two-layer review: Greptile catches things asynchronously on the PR, then `/review` and `/ship` triage those findings as part of the normal workflow. Nothing falls through the cracks.
+
+### Learning from history
+
+Every false positive you confirm gets saved to `~/.gstack/greptile-history.md`. Future runs auto-skip known FP patterns for your codebase. And `/retro` tracks Greptile's batting average over time — so you can see whether the signal-to-noise ratio is improving.
+
+### Example
+
+```
+You:   /ship
+
+Claude: [syncs main, runs tests, pre-landing review...]
+
+        Greptile found 3 comments on this PR:
+
+        [VALID] app/services/payment_service.rb:47 — Race condition:
+        concurrent charges can double-debit. Recommend DB-level advisory
+        lock around the charge block.
+
+        [ALREADY FIXED] app/models/user.rb:12 — Missing null check
+        on email before downcase.
+        → Already fixed in commit abc1234. Auto-replying.
+
+        [FALSE POSITIVE] lib/auth.rb:88 — "Token comparison should
+        use constant-time comparison." We already use
+        ActiveSupport::SecurityUtils.secure_compare here.
+
+        Fixing the race condition in payment_service.rb...
+
+        The auth token comment is a false positive.
+        Options: A) Reply to Greptile explaining  B) Fix anyway  C) Ignore
+
+You:    A
+
+Claude: Replied to Greptile. All tests pass.
+        PR: github.com/you/app/pull/42
+```
+
+Three Greptile comments. One real fix. One auto-acknowledged. One false positive pushed back with a reply. Total extra time: about 30 seconds.
diff --git a/document-release/SKILL.md b/document-release/SKILL.md
index 694d64da..bc8ff4ca 100644
--- a/document-release/SKILL.md
+++ b/document-release/SKILL.md
@@ -29,22 +29,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index 7f48cbe7..d7953a92 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
@@ -109,6 +148,7 @@ But your posture depends on what the user needs:
 * SELECTIVE EXPANSION: You are a rigorous reviewer who also has taste. Hold the current scope as your baseline — make it bulletproof. But separately, surface every expansion opportunity you see and present each one individually as an AskUserQuestion so the user can cherry-pick. Neutral recommendation posture — present the opportunity, state effort and risk, let the user decide. Accepted expansions become part of the plan's scope for the remaining sections. Rejected ones go to "NOT in scope."
 * HOLD SCOPE: You are a rigorous reviewer. The plan's scope is accepted. Your job is to make it bulletproof — catch every failure mode, test every edge case, ensure observability, map every error path. Do not silently reduce OR expand.
 * SCOPE REDUCTION: You are a surgeon. Find the minimum viable version that achieves the core outcome. Cut everything else. Be ruthless.
+* COMPLETENESS IS CHEAP (not a fifth mode — a principle that applies to whatever scope the selected mode keeps): AI coding compresses implementation time 10-100x. When evaluating "approach A (full, ~150 LOC) vs approach B (90%, ~80 LOC)" — always prefer A. The 70-line delta costs seconds with CC. "Ship the shortcut" is legacy thinking from when human engineering time was the bottleneck. Boil the lake.
 Critical rule: In ALL modes, the user is 100% in control. Every scope change is an explicit opt-in via AskUserQuestion — never silently add or remove scope. Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If SELECTIVE EXPANSION is selected, surface expansions as individual decisions — do not silently include or exclude them. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
 Do NOT make any code changes. Do NOT start implementation. Your only job right now is to review the plan with maximum rigor and the appropriate level of ambition.
 
@@ -269,6 +309,11 @@ Think ahead to implementation: What decisions will need to be made during implem
   HOUR 4-5 (integration):  What will surprise them?
   HOUR 6+ (polish/tests):  What will they wish they'd planned for?
 ```
+NOTE: These represent human-team implementation hours. With CC + gstack,
+6 hours of human implementation compresses to ~30-60 minutes. The decisions
+are identical — the implementation is roughly 6-12x faster. Always present
+both scales when discussing effort.
+
 Surface these as questions for the user NOW, not as "figure it out later."
 
 ### 0F. Mode Selection
@@ -548,7 +593,7 @@ For each TODO, describe:
 * **Pros:** What you gain by doing this work.
 * **Cons:** Cost, complexity, or risks of doing it.
 * **Context:** Enough detail that someone picking this up in 3 months understands the motivation, the current state, and where to start.
-* **Effort estimate:** S/M/L/XL
+* **Effort estimate:** S/M/L/XL (human team) → with CC+gstack: S→S, M→S, L→M, XL→L
 * **Priority:** P1/P2/P3
 * **Depends on / blocked by:** Any prerequisites or ordering constraints.
 
@@ -598,6 +643,7 @@ List every ASCII diagram in files this plan touches. Still accurate?
   | TODOS.md updates     | ___ items proposed                          |
   | Scope proposals      | ___ proposed, ___ accepted (EXP + SEL)      |
   | CEO plan             | written / skipped (HOLD/REDUCTION)           |
+  | Lake Score           | X/Y recommendations chose complete option   |
   | Diagrams produced    | ___ (list types)                            |
   | Stale diagrams found | ___                                         |
   | Unresolved decisions | ___ (listed below)                          |
diff --git a/plan-ceo-review/SKILL.md.tmpl b/plan-ceo-review/SKILL.md.tmpl
index 3165dc5b..8695dd8b 100644
--- a/plan-ceo-review/SKILL.md.tmpl
+++ b/plan-ceo-review/SKILL.md.tmpl
@@ -27,6 +27,7 @@ But your posture depends on what the user needs:
 * SELECTIVE EXPANSION: You are a rigorous reviewer who also has taste. Hold the current scope as your baseline — make it bulletproof. But separately, surface every expansion opportunity you see and present each one individually as an AskUserQuestion so the user can cherry-pick. Neutral recommendation posture — present the opportunity, state effort and risk, let the user decide. Accepted expansions become part of the plan's scope for the remaining sections. Rejected ones go to "NOT in scope."
 * HOLD SCOPE: You are a rigorous reviewer. The plan's scope is accepted. Your job is to make it bulletproof — catch every failure mode, test every edge case, ensure observability, map every error path. Do not silently reduce OR expand.
 * SCOPE REDUCTION: You are a surgeon. Find the minimum viable version that achieves the core outcome. Cut everything else. Be ruthless.
+* COMPLETENESS IS CHEAP (not a fifth mode — a principle that applies to whatever scope the selected mode keeps): AI coding compresses implementation time 10-100x. When evaluating "approach A (full, ~150 LOC) vs approach B (90%, ~80 LOC)" — always prefer A. The 70-line delta costs seconds with CC. "Ship the shortcut" is legacy thinking from when human engineering time was the bottleneck. Boil the lake.
 Critical rule: In ALL modes, the user is 100% in control. Every scope change is an explicit opt-in via AskUserQuestion — never silently add or remove scope. Once the user selects a mode, COMMIT to it. Do not silently drift toward a different mode. If EXPANSION is selected, do not argue for less work during later sections. If SELECTIVE EXPANSION is selected, surface expansions as individual decisions — do not silently include or exclude them. If REDUCTION is selected, do not sneak scope back in. Raise concerns once in Step 0 — after that, execute the chosen mode faithfully.
 Do NOT make any code changes. Do NOT start implementation. Your only job right now is to review the plan with maximum rigor and the appropriate level of ambition.
 
@@ -187,6 +188,11 @@ Think ahead to implementation: What decisions will need to be made during implem
   HOUR 4-5 (integration):  What will surprise them?
   HOUR 6+ (polish/tests):  What will they wish they'd planned for?
 ```
+NOTE: These represent human-team implementation hours. With CC + gstack,
+6 hours of human implementation compresses to ~30-60 minutes. The decisions
+are identical — the implementation is roughly 6-12x faster. Always present
+both scales when discussing effort.
+
 Surface these as questions for the user NOW, not as "figure it out later."
 
 ### 0F. Mode Selection
@@ -466,7 +472,7 @@ For each TODO, describe:
 * **Pros:** What you gain by doing this work.
 * **Cons:** Cost, complexity, or risks of doing it.
 * **Context:** Enough detail that someone picking this up in 3 months understands the motivation, the current state, and where to start.
-* **Effort estimate:** S/M/L/XL
+* **Effort estimate:** S/M/L/XL (human team) → with CC+gstack: S→S, M→S, L→M, XL→L
 * **Priority:** P1/P2/P3
 * **Depends on / blocked by:** Any prerequisites or ordering constraints.
 
@@ -516,6 +522,7 @@ List every ASCII diagram in files this plan touches. Still accurate?
   | TODOS.md updates     | ___ items proposed                          |
   | Scope proposals      | ___ proposed, ___ accepted (EXP + SEL)      |
   | CEO plan             | written / skipped (HOLD/REDUCTION)           |
+  | Lake Score           | X/Y recommendations chose complete option   |
   | Diagrams produced    | ___ (list types)                            |
   | Stale diagrams found | ___                                         |
   | Unresolved decisions | ___ (listed below)                          |
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index df5b43e8..f0b2fddd 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -29,22 +29,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index d4e9a83e..d2292af6 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
@@ -110,6 +149,8 @@ Before reviewing anything, answer these questions:
 3. **Complexity check:** If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
 4. **TODOS cross-reference:** Read `TODOS.md` if it exists. Are any deferred items blocking this plan? Can any deferred items be bundled into this PR without expanding scope? Does this plan create new work that should be captured as a TODO?
 
+5. **Completeness check:** Is the plan doing the complete version or a shortcut? With AI-assisted coding, completeness (100% test coverage, full edge case handling, complete error paths) costs 10-100x less than with a human team. If the plan proposes a shortcut that saves human-hours but only saves minutes with CC+gstack, recommend the complete version. Boil the lake.
+
 If the complexity check triggers (8+ files or 2+ new classes/services), proactively recommend scope reduction via AskUserQuestion — explain what's overbuilt, propose a minimal version that achieves the core goal, and ask whether to reduce or proceed as-is. If the complexity check does not trigger, present your Step 0 findings and proceed directly to Section 1.
 
 Always work through the full interactive review: one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
@@ -196,7 +237,7 @@ Follow the AskUserQuestion format from the Preamble above. Additional rules for
 * **One issue = one AskUserQuestion call.** Never combine multiple issues into one question.
 * Describe the problem concretely, with file and line references.
 * Present 2-3 options, including "do nothing" where that's reasonable.
-* For each option, specify in one line: effort, risk, and maintenance burden.
+* For each option, specify in one line: effort (human: ~X / CC: ~Y), risk, and maintenance burden. If the complete option is only marginally more effort than the shortcut with CC, recommend the complete option.
 * **Map the reasoning to my engineering preferences above.** One sentence connecting your recommendation to a specific preference (DRY, explicit > clever, minimal diff, etc.).
 * Label with issue NUMBER + option LETTER (e.g., "3A", "3B").
 * **Escape hatch:** If a section has no issues, say so and move on. If an issue has an obvious fix with no real alternatives, state what you'll do and move on — don't waste a question on it. Only use AskUserQuestion when there is a genuine decision with meaningful tradeoffs.
@@ -246,6 +287,7 @@ At the end of the review, fill in and display this summary so the user can see a
 - What already exists: written
 - TODOS.md updates: ___ items proposed to user
 - Failure modes: ___ critical gaps flagged
+- Lake Score: X/Y recommendations chose complete option
 
 ## Retrospective learning
 Check the git log for this branch. If there are prior commits suggesting a previous review cycle (e.g., review-driven refactors, reverted changes), note what was changed and whether the current plan touches the same areas. Be more aggressive reviewing areas that were previously problematic.
diff --git a/plan-eng-review/SKILL.md.tmpl b/plan-eng-review/SKILL.md.tmpl
index 3433cb75..bf033606 100644
--- a/plan-eng-review/SKILL.md.tmpl
+++ b/plan-eng-review/SKILL.md.tmpl
@@ -45,6 +45,8 @@ Before reviewing anything, answer these questions:
 3. **Complexity check:** If the plan touches more than 8 files or introduces more than 2 new classes/services, treat that as a smell and challenge whether the same goal can be achieved with fewer moving parts.
 4. **TODOS cross-reference:** Read `TODOS.md` if it exists. Are any deferred items blocking this plan? Can any deferred items be bundled into this PR without expanding scope? Does this plan create new work that should be captured as a TODO?
 
+5. **Completeness check:** Is the plan doing the complete version or a shortcut? With AI-assisted coding, completeness (100% test coverage, full edge case handling, complete error paths) costs 10-100x less than with a human team. If the plan proposes a shortcut that saves human-hours but only saves minutes with CC+gstack, recommend the complete version. Boil the lake.
+
 If the complexity check triggers (8+ files or 2+ new classes/services), proactively recommend scope reduction via AskUserQuestion — explain what's overbuilt, propose a minimal version that achieves the core goal, and ask whether to reduce or proceed as-is. If the complexity check does not trigger, present your Step 0 findings and proceed directly to Section 1.
 
 Always work through the full interactive review: one section at a time (Architecture → Code Quality → Tests → Performance) with at most 8 top issues per section.
@@ -131,7 +133,7 @@ Follow the AskUserQuestion format from the Preamble above. Additional rules for
 * **One issue = one AskUserQuestion call.** Never combine multiple issues into one question.
 * Describe the problem concretely, with file and line references.
 * Present 2-3 options, including "do nothing" where that's reasonable.
-* For each option, specify in one line: effort, risk, and maintenance burden.
+* For each option, specify in one line: effort (human: ~X / CC: ~Y), risk, and maintenance burden. If the complete option is only marginally more effort than the shortcut with CC, recommend the complete option.
 * **Map the reasoning to my engineering preferences above.** One sentence connecting your recommendation to a specific preference (DRY, explicit > clever, minimal diff, etc.).
 * Label with issue NUMBER + option LETTER (e.g., "3A", "3B").
 * **Escape hatch:** If a section has no issues, say so and move on. If an issue has an obvious fix with no real alternatives, state what you'll do and move on — don't waste a question on it. Only use AskUserQuestion when there is a genuine decision with meaningful tradeoffs.
@@ -181,6 +183,7 @@ At the end of the review, fill in and display this summary so the user can see a
 - What already exists: written
 - TODOS.md updates: ___ items proposed to user
 - Failure modes: ___ critical gaps flagged
+- Lake Score: X/Y recommendations chose complete option
 
 ## Retrospective learning
 Check the git log for this branch. If there are prior commits suggesting a previous review cycle (e.g., review-driven refactors, reverted changes), note what was changed and whether the current plan touches the same areas. Be more aggressive reviewing areas that were previously problematic.
diff --git a/qa-design-review/SKILL.md b/qa-design-review/SKILL.md
index 7044c560..1d6200c5 100644
--- a/qa-design-review/SKILL.md
+++ b/qa-design-review/SKILL.md
@@ -31,22 +31,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Run the two commands separately: only run `open` if the user says yes, but always run `touch` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/qa-only/SKILL.md b/qa-only/SKILL.md
index 4fa0cf04..594979b9 100644
--- a/qa-only/SKILL.md
+++ b/qa-only/SKILL.md
@@ -27,22 +27,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Run the two commands separately: only run `open` if the user says yes, but always run `touch` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/qa/SKILL.md b/qa/SKILL.md
index c01514cf..10e50715 100644
--- a/qa/SKILL.md
+++ b/qa/SKILL.md
@@ -33,22 +33,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Run the two commands separately: only run `open` if the user says yes, but always run `touch` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/retro/SKILL.md b/retro/SKILL.md
index e7cd3d2c..71eab988 100644
--- a/retro/SKILL.md
+++ b/retro/SKILL.md
@@ -27,22 +27,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Run the two commands separately: only run `open` if the user says yes, but always run `touch` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/review/SKILL.md b/review/SKILL.md
index 3ad683d6..186978ef 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Run the two commands separately: only run `open` if the user says yes, but always run `touch` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/review/checklist.md b/review/checklist.md
index e2246050..282c9944 100644
--- a/review/checklist.md
+++ b/review/checklist.md
@@ -84,6 +84,12 @@ To do this: use Grep to find all references to the sibling values (e.g., grep fo
 - `.expects(:something).never` missing when a code path should explicitly NOT call an external service
 - Security enforcement features (blocking, rate limiting, auth) without integration tests verifying the enforcement path works end-to-end
 
+#### Completeness Gaps
+- Shortcut implementations where the complete version would cost less than 30 minutes of CC+gstack time (e.g., partial enum handling, incomplete error paths, missing edge cases that are straightforward to add)
+- Options presented with only human-team effort estimates — should show both human and CC+gstack time
+- Test coverage gaps where adding the missing tests is a "lake" not an "ocean" (e.g., missing negative-path tests, missing edge case tests that mirror happy-path structure)
+- Features implemented at 80-90% when 100% is achievable with modest additional code
+
 #### Crypto & Entropy
 - Truncation of data instead of hashing (last N chars instead of SHA-256) — less entropy, easier collisions
 - `rand()` / `Random.rand` for security-sensitive values — use `SecureRandom` instead
@@ -113,6 +119,7 @@ CRITICAL (highest severity):      INFORMATIONAL (lower severity):
 ├─ LLM Output Trust Boundary      ├─ Dead Code & Consistency
 └─ Enum & Value Completeness      ├─ LLM Prompt Issues
                                    ├─ Test Gaps
+                                   ├─ Completeness Gaps
                                    ├─ Crypto & Entropy
                                    ├─ Time Window Safety
                                    ├─ Type Coercion at Boundaries
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index 31684e21..d2e86ecf 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -107,22 +107,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 \`\`\`
 
 If output shows \`UPGRADE_AVAILABLE <old> <new>\`: read \`~/.claude/skills/gstack/gstack-upgrade/SKILL.md\` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If \`JUST_UPGRADED <from> <to>\`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If \`LAKE_INTRO\` is \`no\`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+\`\`\`bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+\`\`\`
+
+Run the two commands separately: only run \`open\` if the user says yes, but always run \`touch\` to mark the intro as seen so that it is shown only once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the \`_BRANCH\` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** \`RECOMMENDATION: Choose [X] because [one-line reason]\`
-4. **Options:** Lettered options: \`A) ... B) ... C) ...\`
+3. **Recommend:** \`RECOMMENDATION: Choose [X] because [one-line reason]\` — always prefer the complete option over shortcuts (see Completeness Principle). Include \`Completeness: X/10\` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: \`A) ... B) ... C) ...\` — when an option involves effort, show both scales: \`(human: ~X / CC: ~Y)\`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If \`_CONTRIB\` is \`true\`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/setup-browser-cookies/SKILL.md b/setup-browser-cookies/SKILL.md
index faebe520..da64dec4 100644
--- a/setup-browser-cookies/SKILL.md
+++ b/setup-browser-cookies/SKILL.md
@@ -25,22 +25,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/ship/SKILL.md b/ship/SKILL.md
index 32582088..e2b524d9 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -28,22 +28,61 @@ find ~/.gstack/sessions -mmin +120 -type f -delete 2>/dev/null || true
 _CONTRIB=$(~/.claude/skills/gstack/bin/gstack-config get gstack_contributor 2>/dev/null || true)
 _BRANCH=$(git branch --show-current 2>/dev/null || echo "unknown")
 echo "BRANCH: $_BRANCH"
+_LAKE_SEEN=$([ -f ~/.gstack/.completeness-intro-seen ] && echo "yes" || echo "no")
+echo "LAKE_INTRO: $_LAKE_SEEN"
 ```
 
 If output shows `UPGRADE_AVAILABLE <old> <new>`: read `~/.claude/skills/gstack/gstack-upgrade/SKILL.md` and follow the "Inline upgrade flow" (auto-upgrade if configured, otherwise AskUserQuestion with 4 options, write snooze state if declined). If `JUST_UPGRADED <from> <to>`: tell user "Running gstack v{to} (just updated!)" and continue.
 
+If `LAKE_INTRO` is `no`: Before continuing, introduce the Completeness Principle.
+Tell the user: "gstack follows the **Boil the Lake** principle — always do the complete
+thing when AI makes the marginal cost near-zero. Read more: https://garryslist.org/posts/boil-the-ocean"
+Then offer to open the essay in their default browser:
+
+```bash
+open https://garryslist.org/posts/boil-the-ocean
+touch ~/.gstack/.completeness-intro-seen
+```
+
+Only run `open` if the user says yes. Always run `touch` to mark as seen. This only happens once.
+
 ## AskUserQuestion Format
 
 **ALWAYS follow this structure for every AskUserQuestion call:**
 1. **Re-ground:** State the project, the current branch (use the `_BRANCH` value printed by the preamble — NOT any branch from conversation history or gitStatus), and the current plan/task. (1-2 sentences)
 2. **Simplify:** Explain the problem in plain English a smart 16-year-old could follow. No raw function names, no internal jargon, no implementation details. Use concrete examples and analogies. Say what it DOES, not what it's called.
-3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]`
-4. **Options:** Lettered options: `A) ... B) ... C) ...`
+3. **Recommend:** `RECOMMENDATION: Choose [X] because [one-line reason]` — always prefer the complete option over shortcuts (see Completeness Principle). Include `Completeness: X/10` for each option. Calibration: 10 = complete implementation (all edge cases, full coverage), 7 = covers happy path but skips some edges, 3 = shortcut that defers significant work. If both options are 8+, pick the higher; if one is ≤5, flag it.
+4. **Options:** Lettered options: `A) ... B) ... C) ...` — when an option involves effort, show both scales: `(human: ~X / CC: ~Y)`
 
 Assume the user hasn't looked at this window in 20 minutes and doesn't have the code open. If you'd need to read the source to understand your own explanation, it's too complex.
 
 Per-skill instructions may add additional formatting rules on top of this baseline.
 
+## Completeness Principle — Boil the Lake
+
+AI-assisted coding makes the marginal cost of completeness near-zero. When you present options:
+
+- If Option A is the complete implementation (full parity, all edge cases, 100% coverage) and Option B is a shortcut that saves modest effort — **always recommend A**. The delta between 80 lines and 150 lines is meaningless with CC+gstack. "Good enough" is the wrong instinct when "complete" costs minutes more.
+- **Lake vs. ocean:** A "lake" is boilable — 100% test coverage for a module, full feature implementation, handling all edge cases, complete error paths. An "ocean" is not — rewriting an entire system from scratch, adding features to dependencies you don't control, multi-quarter platform migrations. Recommend boiling lakes. Flag oceans as out of scope.
+- **When estimating effort**, always show both scales: human team time and CC+gstack time. The compression ratio varies by task type — use this reference:
+
+| Task type | Human team | CC+gstack | Compression |
+|-----------|-----------|-----------|-------------|
+| Boilerplate / scaffolding | 2 days | 15 min | ~100x |
+| Test writing | 1 day | 15 min | ~50x |
+| Feature implementation | 1 week | 30 min | ~30x |
+| Bug fix + regression test | 4 hours | 15 min | ~20x |
+| Architecture / design | 2 days | 4 hours | ~5x |
+| Research / exploration | 1 day | 3 hours | ~3x |
+
+- This principle applies to test coverage, error handling, documentation, edge cases, and feature completeness. Don't skip the last 10% to "save time" — with AI, that 10% costs seconds.
+
+**Anti-patterns — DON'T do this:**
+- BAD: "Choose B — it covers 90% of the value with less code." (If A is only 70 lines more, choose A.)
+- BAD: "We can skip edge case handling to save time." (Edge case handling costs minutes with CC.)
+- BAD: "Let's defer test coverage to a follow-up PR." (Tests are the cheapest lake to boil.)
+- BAD: Quoting only human-team effort: "This would take 2 weeks." (Say: "2 weeks human / ~1 hour CC.")
+
 ## Contributor Mode
 
 If `_CONTRIB` is `true`: you are in **contributor mode**. You're a gstack user who also helps make it better.
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 2ea56da9..021e41da 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1886,7 +1886,7 @@ Write DESIGN.md and CLAUDE.md (or update it) in the working directory.`,
 
 This is a civic tech data platform called CivicPulse. Read the README.md.
 
-DO research competitors before proposing — search for civic tech and government data platform designs. Skip the font preview page. Skip any AskUserQuestion calls — this is non-interactive.
+DO research what's out there before proposing — search for civic tech and government data platform designs. Skip the font preview page. Skip any AskUserQuestion calls — this is non-interactive.
 
 Write DESIGN.md to the working directory.`,
       workingDirectory: designDir,
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 54e03a4d..81d97d31 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -617,6 +617,43 @@ describe('Enum & Value Completeness in review checklist', () => {
   });
 });
 
+// --- Completeness Principle spot-check ---
+
+describe('Completeness Principle in generated SKILL.md files', () => {
+  const skillsWithPreamble = [
+    'SKILL.md', 'browse/SKILL.md', 'qa/SKILL.md',
+    'qa-only/SKILL.md',
+    'setup-browser-cookies/SKILL.md',
+    'ship/SKILL.md', 'review/SKILL.md',
+    'plan-ceo-review/SKILL.md', 'plan-eng-review/SKILL.md',
+    'retro/SKILL.md',
+    'plan-design-review/SKILL.md',
+    'qa-design-review/SKILL.md',
+    'design-consultation/SKILL.md',
+    'document-release/SKILL.md',
+  ];
+
+  for (const skill of skillsWithPreamble) {
+    test(`${skill} contains Completeness Principle section`, () => {
+      const content = fs.readFileSync(path.join(ROOT, skill), 'utf-8');
+      expect(content).toContain('Completeness Principle');
+      expect(content).toContain('Boil the Lake');
+    });
+  }
+
+  test('Completeness Principle includes compression table', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
+    expect(content).toContain('CC+gstack');
+    expect(content).toContain('Compression');
+  });
+
+  test('Completeness Principle includes anti-patterns', () => {
+    const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
+    expect(content).toContain('BAD:');
+    expect(content).toContain('Anti-patterns');
+  });
+});
+
 // --- Part 7: Planted-bug fixture validation (A4) ---
 
 describe('Planted-bug fixture validation', () => {

From 17c1c06cd98f78bf0bd25adba2effa8048a76936 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 18:45:41 -0500
Subject: [PATCH 18/22] feat: diff-based test selection for E2E and LLM-judge
 evals (v0.6.1.0) (#139)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: diff-based test selection for E2E and LLM-judge evals

Each test declares file dependencies in a TOUCHFILES map. The test runner
checks git diff against the base branch and only runs tests whose
dependencies were modified. Global touchfiles (session-runner, eval-store,
gen-skill-docs) trigger all tests.

New scripts: test:e2e:all, test:evals:all, eval:select

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* chore: bump version and changelog (v0.6.1.0)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* fix: plan-design-review-audit eval — bump turns to 30, add efficiency hints

The test was flaky at 20 turns because the agent reads a 300-line SKILL.md,
navigates, extracts design data, and writes a report. Added hints to skip
preamble/batch commands/write early while still testing the real SKILL.md.
Now completes in ~13 turns consistently.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                |  13 ++
 CLAUDE.md                   |  13 +-
 VERSION                     |   2 +-
 package.json                |   5 +-
 scripts/eval-select.ts      |  86 ++++++++++++
 test/helpers/touchfiles.ts  | 178 +++++++++++++++++++++++++
 test/skill-e2e.test.ts      | 124 ++++++++++++------
 test/skill-llm-eval.test.ts |  62 +++++++--
 test/touchfiles.test.ts     | 253 ++++++++++++++++++++++++++++++++++++
 9 files changed, 681 insertions(+), 55 deletions(-)
 create mode 100644 scripts/eval-select.ts
 create mode 100644 test/helpers/touchfiles.ts
 create mode 100644 test/touchfiles.test.ts

diff --git a/CHANGELOG.md b/CHANGELOG.md
index be473577..5062711c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,18 @@
 # Changelog
 
+## [0.6.1.0] - 2026-03-17
+
+### Added
+
+- **E2E and LLM-judge tests now only run what you changed.** Each test declares which source files it depends on. When you run `bun run test:e2e`, it checks your diff and skips tests whose dependencies weren't touched. A branch that only changes `/retro` now runs 2 tests instead of 31. Use `bun run test:e2e:all` to force everything.
+- **`bun run eval:select` previews which tests would run.** See exactly which tests your diff triggers before spending API credits. Supports `--json` for scripting and `--base <branch>` to override the base branch.
+- **Completeness guardrail catches forgotten test entries.** A free unit test validates that every `testName` in the E2E and LLM-judge test files has a corresponding entry in the TOUCHFILES map. New tests without entries fail `bun test` immediately — no silent always-run degradation.
+
+### Changed
+
+- `test:evals` and `test:e2e` now auto-select based on diff (was: all-or-nothing)
+- New `test:evals:all` and `test:e2e:all` scripts for explicit full runs
+
 ## 0.6.1 — 2026-03-17 — Boil the Lake
 
 Every gstack skill now follows the **Completeness Principle**: always recommend the
diff --git a/CLAUDE.md b/CLAUDE.md
index 34868b0a..213be490 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -5,8 +5,11 @@
 ```bash
 bun install          # install dependencies
 bun test             # run free tests (browse + snapshot + skill validation)
-bun run test:evals   # run paid evals: LLM judge + E2E (~$4/run)
-bun run test:e2e     # run E2E tests only (~$3.85/run)
+bun run test:evals   # run paid evals: LLM judge + E2E (diff-based, ~$4/run max)
+bun run test:evals:all  # run ALL paid evals regardless of diff
+bun run test:e2e     # run E2E tests only (diff-based, ~$3.85/run max)
+bun run test:e2e:all # run ALL E2E tests regardless of diff
+bun run eval:select  # show which tests would run based on current diff
 bun run dev <cmd>    # run CLI in dev mode, e.g. bun run dev goto https://example.com
 bun run build        # gen docs + compile binaries
 bun run gen:skill-docs  # regenerate SKILL.md files from templates
@@ -21,6 +24,12 @@ bun run eval:summary # aggregate stats across all eval runs
 (tool-by-tool via `--output-format stream-json --verbose`). Results are persisted
 to `~/.gstack-dev/evals/` with auto-comparison against the previous run.
 
+**Diff-based test selection:** `test:evals` and `test:e2e` auto-select tests based
+on `git diff` against the base branch. Each test declares its file dependencies in
+`test/helpers/touchfiles.ts`. Changes to any `GLOBAL_TOUCHFILES` entry (session-runner,
+eval-store, llm-judge, gen-skill-docs, touchfiles, test-server) trigger all tests, as does an
+empty diff. Use `EVALS_ALL=1` or the `:all` scripts to force all tests. Run `eval:select` to preview which tests would run.
+
 ## Project structure
 
 ```
diff --git a/VERSION b/VERSION
index ee6cdce3..44e7f9a2 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.6.1
+0.6.1.0
diff --git a/package.json b/package.json
index a5044b7d..e725b4ab 100644
--- a/package.json
+++ b/package.json
@@ -14,14 +14,17 @@
     "server": "bun run browse/src/server.ts",
     "test": "bun test browse/test/ test/ --ignore test/skill-e2e.test.ts --ignore test/skill-llm-eval.test.ts",
     "test:evals": "EVALS=1 bun test test/skill-llm-eval.test.ts test/skill-e2e.test.ts",
+    "test:evals:all": "EVALS=1 EVALS_ALL=1 bun test test/skill-llm-eval.test.ts test/skill-e2e.test.ts",
     "test:e2e": "EVALS=1 bun test test/skill-e2e.test.ts",
+    "test:e2e:all": "EVALS=1 EVALS_ALL=1 bun test test/skill-e2e.test.ts",
     "skill:check": "bun run scripts/skill-check.ts",
     "dev:skill": "bun run scripts/dev-skill.ts",
     "start": "bun run browse/src/server.ts",
     "eval:list": "bun run scripts/eval-list.ts",
     "eval:compare": "bun run scripts/eval-compare.ts",
     "eval:summary": "bun run scripts/eval-summary.ts",
-    "eval:watch": "bun run scripts/eval-watch.ts"
+    "eval:watch": "bun run scripts/eval-watch.ts",
+    "eval:select": "bun run scripts/eval-select.ts"
   },
   "dependencies": {
     "playwright": "^1.58.2",
diff --git a/scripts/eval-select.ts b/scripts/eval-select.ts
new file mode 100644
index 00000000..cdbdcc84
--- /dev/null
+++ b/scripts/eval-select.ts
@@ -0,0 +1,86 @@
+#!/usr/bin/env bun
+/**
+ * Show which E2E and LLM-judge tests would run based on the current git diff.
+ *
+ * Usage:
+ *   bun run eval:select              # human-readable output
+ *   bun run eval:select --json       # machine-readable JSON
+ *   bun run eval:select --base main  # override base branch (EVALS_BASE is honored too)
+ */
+
+import * as path from 'path';
+import {
+  selectTests,
+  detectBaseBranch,
+  getChangedFiles,
+  E2E_TOUCHFILES,
+  LLM_JUDGE_TOUCHFILES,
+  GLOBAL_TOUCHFILES,
+} from '../test/helpers/touchfiles';
+
+const ROOT = path.resolve(import.meta.dir, '..');
+const args = process.argv.slice(2);
+const jsonMode = args.includes('--json');
+const baseIdx = args.indexOf('--base');
+const baseOverride = baseIdx >= 0 ? args[baseIdx + 1] : undefined;
+
+// Base precedence: --base flag, then EVALS_BASE (the override the test files read), then auto-detect.
+const baseBranch = baseOverride || process.env.EVALS_BASE || detectBaseBranch(ROOT) || 'main';
+const changedFiles = getChangedFiles(baseBranch, ROOT);
+
+if (changedFiles.length === 0) {
+  if (jsonMode) { // changed_files stays an array here so both JSON shapes can be iterated
+    console.log(JSON.stringify({ base: baseBranch, changed_files: [], e2e: 'all', llm_judge: 'all', reason: 'no diff — would run all tests' }));
+  } else {
+    console.log(`Base: ${baseBranch}`);
+    console.log('No changed files detected — all tests would run.');
+  }
+  process.exit(0);
+}
+
+const e2eSelection = selectTests(changedFiles, E2E_TOUCHFILES, GLOBAL_TOUCHFILES);
+const llmSelection = selectTests(changedFiles, LLM_JUDGE_TOUCHFILES, GLOBAL_TOUCHFILES);
+
+if (jsonMode) {
+  console.log(JSON.stringify({
+    base: baseBranch,
+    changed_files: changedFiles,
+    e2e: {
+      selected: e2eSelection.selected,
+      skipped: e2eSelection.skipped,
+      reason: e2eSelection.reason,
+      count: `${e2eSelection.selected.length}/${Object.keys(E2E_TOUCHFILES).length}`,
+    },
+    llm_judge: {
+      selected: llmSelection.selected,
+      skipped: llmSelection.skipped,
+      reason: llmSelection.reason,
+      count: `${llmSelection.selected.length}/${Object.keys(LLM_JUDGE_TOUCHFILES).length}`,
+    },
+  }, null, 2));
+} else {
+  console.log(`Base: ${baseBranch}`);
+  console.log(`Changed files: ${changedFiles.length}`);
+  console.log();
+
+  console.log(`E2E (${e2eSelection.reason}): ${e2eSelection.selected.length}/${Object.keys(E2E_TOUCHFILES).length} tests`);
+  if (e2eSelection.selected.length > 0 && e2eSelection.selected.length < Object.keys(E2E_TOUCHFILES).length) {
+    console.log(`  Selected: ${e2eSelection.selected.join(', ')}`);
+    console.log(`  Skipped:  ${e2eSelection.skipped.join(', ')}`);
+  } else if (e2eSelection.selected.length === 0) {
+    console.log('  No E2E tests affected.');
+  } else {
+    console.log('  All E2E tests selected.');
+  }
+  console.log();
+
+  console.log(`LLM-judge (${llmSelection.reason}): ${llmSelection.selected.length}/${Object.keys(LLM_JUDGE_TOUCHFILES).length} tests`);
+  if (llmSelection.selected.length > 0 && llmSelection.selected.length < Object.keys(LLM_JUDGE_TOUCHFILES).length) {
+    console.log(`  Selected: ${llmSelection.selected.join(', ')}`);
+    console.log(`  Skipped:  ${llmSelection.skipped.join(', ')}`);
+  } else if (llmSelection.selected.length === 0) {
+    console.log('  No LLM-judge tests affected.');
+  } else {
+    console.log('  All LLM-judge tests selected.');
+  }
+}
diff --git a/test/helpers/touchfiles.ts b/test/helpers/touchfiles.ts
new file mode 100644
index 00000000..30a15579
--- /dev/null
+++ b/test/helpers/touchfiles.ts
@@ -0,0 +1,178 @@
+/**
+ * Diff-based test selection for E2E and LLM-judge evals.
+ *
+ * Each test declares which source files it depends on ("touchfiles").
+ * The test runner checks `git diff` and only runs tests whose
+ * dependencies were modified. Override with EVALS_ALL=1 to run everything.
+ */
+
+import { spawnSync } from 'child_process';
+
+// --- Glob matching ---
+
+/**
+ * Match a file path against a glob pattern (anchored: the whole path must match).
+ * Supports `**` (any characters, including `/`) and `*` (any characters except `/`).
+ * Every other character is literal: regex metacharacters such as `+`, `(`, `[`
+ * or `?` are escaped so they can neither alter the match nor throw a SyntaxError.
+ */
+export function matchGlob(file: string, pattern: string): boolean {
+  const regexStr = pattern
+    .replace(/[.+?^${}()|[\]\\]/g, '\\$&') // escape all regex metacharacters except `*`
+    .replace(/\*\*/g, '{{GLOBSTAR}}') // placeholder so the single-`*` pass leaves `**` alone
+    .replace(/\*/g, '[^/]*')
+    .replace(/\{\{GLOBSTAR\}\}/g, '.*');
+  return new RegExp(`^${regexStr}$`).test(file);
+}
+
+// --- Touchfile maps ---
+
+/**
+ * E2E test touchfiles — keyed by testName (the string passed to runSkillTest).
+ * Each test lists the file patterns that, if changed, require the test to run.
+ */
+export const E2E_TOUCHFILES: Record<string, string[]> = {
+  // Browse core
+  'browse-basic':    ['browse/src/**'],
+  'browse-snapshot': ['browse/src/**'],
+
+  // SKILL.md setup + preamble (depend on ROOT SKILL.md only)
+  'skillmd-setup-discovery':  ['SKILL.md', 'SKILL.md.tmpl'],
+  'skillmd-no-local-binary':  ['SKILL.md', 'SKILL.md.tmpl'],
+  'skillmd-outside-git':      ['SKILL.md', 'SKILL.md.tmpl'],
+  'contributor-mode':         ['SKILL.md', 'SKILL.md.tmpl'],
+  'session-awareness':        ['SKILL.md', 'SKILL.md.tmpl'],
+
+  // QA
+  'qa-quick':       ['qa/**', 'browse/src/**'],
+  'qa-b6-static':   ['qa/**', 'browse/src/**', 'browse/test/fixtures/qa-eval.html', 'test/fixtures/qa-eval-ground-truth.json'],
+  'qa-b7-spa':      ['qa/**', 'browse/src/**', 'browse/test/fixtures/qa-eval-spa.html', 'test/fixtures/qa-eval-spa-ground-truth.json'],
+  'qa-b8-checkout': ['qa/**', 'browse/src/**', 'browse/test/fixtures/qa-eval-checkout.html', 'test/fixtures/qa-eval-checkout-ground-truth.json'],
+  'qa-only-no-fix': ['qa-only/**', 'qa/templates/**'],
+  'qa-fix-loop':    ['qa/**', 'browse/src/**'],
+
+  // Review
+  'review-sql-injection':     ['review/**', 'test/fixtures/review-eval-vuln.rb'],
+  'review-enum-completeness': ['review/**', 'test/fixtures/review-eval-enum*.rb'],
+  'review-base-branch':       ['review/**'],
+
+  // Plan reviews
+  'plan-ceo-review':           ['plan-ceo-review/**'],
+  'plan-ceo-review-selective': ['plan-ceo-review/**'],
+  'plan-eng-review':           ['plan-eng-review/**'],
+  'plan-eng-review-artifact':  ['plan-eng-review/**'],
+
+  // Ship
+  'ship-base-branch': ['ship/**'],
+
+  // Retro
+  'retro':             ['retro/**'],
+  'retro-base-branch': ['retro/**'],
+
+  // Document-release
+  'document-release': ['document-release/**'],
+
+  // QA bootstrap
+  'qa-bootstrap': ['qa/**', 'browse/src/**', 'ship/**'],
+
+  // Ship coverage audit
+  'ship-coverage-audit': ['ship/**'],
+
+  // Design
+  'design-consultation-core':     ['design-consultation/**'],
+  'design-consultation-research': ['design-consultation/**'],
+  'design-consultation-existing': ['design-consultation/**'],
+  'design-consultation-preview':  ['design-consultation/**'],
+  'plan-design-review-audit':     ['plan-design-review/**'],
+  'plan-design-review-export':    ['plan-design-review/**'],
+  'qa-design-review-fix':         ['qa-design-review/**', 'browse/src/**'],
+};
+
+/**
+ * LLM-judge test touchfiles — keyed by test description string.
+ */
+export const LLM_JUDGE_TOUCHFILES: Record<string, string[]> = {
+  'command reference table':          ['SKILL.md', 'SKILL.md.tmpl', 'browse/src/commands.ts'],
+  'snapshot flags reference':         ['SKILL.md', 'SKILL.md.tmpl', 'browse/src/snapshot.ts'],
+  'browse/SKILL.md reference':        ['browse/SKILL.md', 'browse/SKILL.md.tmpl', 'browse/src/**'],
+  'setup block':                      ['SKILL.md', 'SKILL.md.tmpl'],
+  'regression vs baseline':           ['SKILL.md', 'SKILL.md.tmpl', 'browse/src/commands.ts', 'test/fixtures/eval-baselines.json'],
+  'qa/SKILL.md workflow':             ['qa/SKILL.md', 'qa/SKILL.md.tmpl'],
+  'qa/SKILL.md health rubric':        ['qa/SKILL.md', 'qa/SKILL.md.tmpl'],
+  'cross-skill greptile consistency': ['review/SKILL.md', 'review/SKILL.md.tmpl', 'ship/SKILL.md', 'ship/SKILL.md.tmpl', 'review/greptile-triage.md', 'retro/SKILL.md', 'retro/SKILL.md.tmpl'],
+  'baseline score pinning':           ['SKILL.md', 'SKILL.md.tmpl', 'test/fixtures/eval-baselines.json'],
+};
+
+/**
+ * Changes to any of these files trigger ALL tests (both E2E and LLM-judge).
+ */
+export const GLOBAL_TOUCHFILES = [
+  'test/helpers/session-runner.ts',
+  'test/helpers/eval-store.ts',
+  'test/helpers/llm-judge.ts',
+  'scripts/gen-skill-docs.ts',
+  'test/helpers/touchfiles.ts',
+  'browse/test/test-server.ts',
+];
+
+// --- Base branch detection ---
+
+/**
+ * Pick the diff base: the first of origin/main, origin/master, main, master
+ * that `git rev-parse --verify` accepts when run in `cwd`; null if none does.
+ */
+export function detectBaseBranch(cwd: string): string | null {
+  const candidates = ['origin/main', 'origin/master', 'main', 'master'];
+  const resolves = (ref: string): boolean => {
+    const probe = spawnSync('git', ['rev-parse', '--verify', ref], { cwd, stdio: 'pipe', timeout: 3000 });
+    return probe.status === 0;
+  };
+  const found = candidates.find(resolves);
+  return found ?? null;
+}
+
+/**
+ * List the paths printed by `git diff --name-only <baseBranch>...HEAD` run in `cwd`.
+ * Returns [] when git does not exit with status 0, so a failure looks like "no changes".
+ */
+export function getChangedFiles(baseBranch: string, cwd: string): string[] {
+  const range = `${baseBranch}...HEAD`;
+  const diff = spawnSync('git', ['diff', '--name-only', range], { cwd, stdio: 'pipe', timeout: 5000 });
+  const names = diff.status === 0 ? diff.stdout.toString().trim().split('\n') : [];
+  return names.filter(name => name.length > 0);
+}
+
+// --- Test selection ---
+
+/**
+ * Partition the tests in `touchfiles` into those to run and those to skip.
+ *
+ * - The first changed file matching any global touchfile selects every test
+ *   (reason `global: <file>`).
+ * - Otherwise a test is selected when some changed file matches one of its
+ *   patterns (reason `diff`); all remaining tests are reported as skipped.
+ */
+export function selectTests(
+  changedFiles: string[],
+  touchfiles: Record<string, string[]>,
+  globalTouchfiles: string[] = GLOBAL_TOUCHFILES,
+): { selected: string[]; skipped: string[]; reason: string } {
+  const matchesAny = (file: string, patterns: string[]): boolean =>
+    patterns.some(pattern => matchGlob(file, pattern));
+
+  // A global touchfile hit short-circuits to a full run.
+  const globalHit = changedFiles.find(file => matchesAny(file, globalTouchfiles));
+  if (globalHit !== undefined) {
+    return { selected: Object.keys(touchfiles), skipped: [], reason: `global: ${globalHit}` };
+  }
+
+  // Otherwise each test lands in exactly one bucket, in declaration order.
+  const selected: string[] = [];
+  const skipped: string[] = [];
+  Object.entries(touchfiles).forEach(([testName, patterns]) => {
+    const wasTouched = changedFiles.some(file => matchesAny(file, patterns));
+    (wasTouched ? selected : skipped).push(testName);
+  });
+
+  return { selected, skipped, reason: 'diff' };
+}
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 021e41da..338ec2f1 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -1,10 +1,11 @@
 import { describe, test, expect, beforeAll, afterAll } from 'bun:test';
 import { runSkillTest } from './helpers/session-runner';
 import type { SkillTestResult } from './helpers/session-runner';
-import { outcomeJudge } from './helpers/llm-judge';
+import { outcomeJudge, callJudge } from './helpers/llm-judge';
 import { EvalCollector, judgePassed } from './helpers/eval-store';
 import type { EvalTestEntry } from './helpers/eval-store';
 import { startTestServer } from '../browse/test/test-server';
+import { selectTests, detectBaseBranch, getChangedFiles, E2E_TOUCHFILES, GLOBAL_TOUCHFILES } from './helpers/touchfiles';
 import { spawnSync } from 'child_process';
 import * as fs from 'fs';
 import * as path from 'path';
@@ -21,6 +22,41 @@ const ROOT = path.resolve(import.meta.dir, '..');
 const evalsEnabled = !!process.env.EVALS;
 const describeE2E = evalsEnabled ? describe : describe.skip;
 
+// --- Diff-based test selection ---
+// When EVALS_ALL is not set, only run tests whose touchfiles were modified.
+// Set EVALS_ALL=1 to force all tests. Set EVALS_BASE to override base branch.
+let selectedTests: string[] | null = null; // null = run all
+
+if (evalsEnabled && !process.env.EVALS_ALL) {
+  const baseBranch = process.env.EVALS_BASE
+    || detectBaseBranch(ROOT)
+    || 'main';
+  const changedFiles = getChangedFiles(baseBranch, ROOT);
+
+  if (changedFiles.length > 0) {
+    const selection = selectTests(changedFiles, E2E_TOUCHFILES, GLOBAL_TOUCHFILES);
+    selectedTests = selection.selected;
+    process.stderr.write(`\nE2E selection (${selection.reason}): ${selection.selected.length}/${Object.keys(E2E_TOUCHFILES).length} tests\n`);
+    if (selection.skipped.length > 0) {
+      process.stderr.write(`  Skipped: ${selection.skipped.join(', ')}\n`);
+    }
+    process.stderr.write('\n');
+  }
+  // If changedFiles is empty (e.g., on main branch, or `git diff` failed), selectedTests stays null → run all
+}
+
+/** Register `name` with describeE2E unless a selection exists and contains none of `testNames`; then use describe.skip. */
+function describeIfSelected(name: string, testNames: string[], fn: () => void) {
+  const noneSelected = selectedTests !== null && !testNames.some(t => selectedTests!.includes(t));
+  (noneSelected ? describe.skip : describeE2E)(name, fn);
+}
+
+/** Register one test under `testName`; it becomes test.skip when a selection exists and does not include it. */
+function testIfSelected(testName: string, fn: () => Promise<void>, timeout: number) {
+  const excluded = selectedTests !== null && !selectedTests.includes(testName);
+  (excluded ? test.skip : test)(testName, fn, timeout);
+}
+
 // Eval result collector — accumulates test results, writes to ~/.gstack-dev/evals/ on finalize
 const evalCollector = evalsEnabled ? new EvalCollector('e2e') : null;
 
@@ -133,7 +169,10 @@ if (evalsEnabled) {
   }
 }
 
-describeE2E('Skill E2E tests', () => {
+describeIfSelected('Skill E2E tests', [
+  'browse-basic', 'browse-snapshot', 'skillmd-setup-discovery',
+  'skillmd-no-local-binary', 'skillmd-outside-git', 'contributor-mode', 'session-awareness',
+], () => {
   beforeAll(() => {
     testServer = startTestServer();
     tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-'));
@@ -145,7 +184,7 @@ describeE2E('Skill E2E tests', () => {
     try { fs.rmSync(tmpDir, { recursive: true, force: true }); } catch {}
   });
 
-  test('browse basic commands work without errors', async () => {
+  testIfSelected('browse-basic', async () => {
     const result = await runSkillTest({
       prompt: `You have a browse binary at ${browseBin}. Assign it to B variable and run these commands in sequence:
 1. $B goto ${testServer.url}
@@ -166,7 +205,7 @@ Report the results of each command.`,
     expect(result.exitReason).toBe('success');
   }, 90_000);
 
-  test('browse snapshot flags all work', async () => {
+  testIfSelected('browse-snapshot', async () => {
     const result = await runSkillTest({
       prompt: `You have a browse binary at ${browseBin}. Assign it to B variable and run:
 1. $B goto ${testServer.url}
@@ -191,7 +230,7 @@ Report what each command returned.`,
     expect(result.exitReason).toBe('success');
   }, 90_000);
 
-  test('agent discovers browse binary via SKILL.md setup block', async () => {
+  testIfSelected('skillmd-setup-discovery', async () => {
     const skillMd = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     const setupStart = skillMd.indexOf('## SETUP');
     const setupEnd = skillMd.indexOf('## IMPORTANT');
@@ -220,7 +259,7 @@ Report whether it worked.`,
     expect(result.exitReason).toBe('success');
   }, 90_000);
 
-  test('SKILL.md setup block handles missing local binary gracefully', async () => {
+  testIfSelected('skillmd-no-local-binary', async () => {
     // Create a tmpdir with no browse binary — no local .claude/skills/gstack/browse/dist/browse
     const emptyDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-empty-'));
 
@@ -255,7 +294,7 @@ Report the exact output. Do NOT try to fix or install anything — just report w
     try { fs.rmSync(emptyDir, { recursive: true, force: true }); } catch {}
   }, 60_000);
 
-  test('SKILL.md setup block works outside git repo', async () => {
+  testIfSelected('skillmd-outside-git', async () => {
     // Create a tmpdir outside any git repo
     const nonGitDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-nogit-'));
 
@@ -286,7 +325,7 @@ Report the exact output — either "READY: <path>" or "NEEDS_SETUP".`,
     try { fs.rmSync(nonGitDir, { recursive: true, force: true }); } catch {}
   }, 60_000);
 
-  test('contributor mode files a report on gstack error', async () => {
+  testIfSelected('contributor-mode', async () => {
     const contribDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-contrib-'));
     const logsDir = path.join(contribDir, 'contributor-logs');
     fs.mkdirSync(logsDir, { recursive: true });
@@ -342,7 +381,7 @@ File a contributor report about this issue. Then tell me what you filed.`,
     try { fs.rmSync(contribDir, { recursive: true, force: true }); } catch {}
   }, 90_000);
 
-  test('session awareness adds ELI16 context when _SESSIONS >= 3', async () => {
+  testIfSelected('session-awareness', async () => {
     const sessionDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-session-'));
 
     // Set up a git repo so there's project/branch context to reference
@@ -413,7 +452,7 @@ Remember: _SESSIONS=4, so ELI16 mode is active. The user is juggling multiple wi
 
 // --- B4: QA skill E2E ---
 
-describeE2E('QA skill E2E', () => {
+describeIfSelected('QA skill E2E', ['qa-quick'], () => {
   let qaDir: string;
 
   beforeAll(() => {
@@ -468,7 +507,7 @@ Write your report to ${qaDir}/qa-reports/qa-report.md`,
 
 // --- B5: Review skill E2E ---
 
-describeE2E('Review skill E2E', () => {
+describeIfSelected('Review skill E2E', ['review-sql-injection'], () => {
   let reviewDir: string;
 
   beforeAll(() => {
@@ -527,7 +566,7 @@ Write your review findings to ${reviewDir}/review-output.md`,
 
 // --- Review: Enum completeness E2E ---
 
-describeE2E('Review enum completeness E2E', () => {
+describeIfSelected('Review enum completeness E2E', ['review-enum-completeness'], () => {
   let enumDir: string;
 
   beforeAll(() => {
@@ -603,7 +642,10 @@ The diff adds a new "returned" status to the Order model. Your job is to check i
 const hasApiKey = !!process.env.ANTHROPIC_API_KEY;
 const describeOutcome = (evalsEnabled && hasApiKey) ? describe : describe.skip;
 
-describeOutcome('Planted-bug outcome evals', () => {
+// Wrap describeOutcome with selection — skip if no planted-bug tests are selected
+const outcomeTestNames = ['qa-b6-static', 'qa-b7-spa', 'qa-b8-checkout'];
+const anyOutcomeSelected = selectedTests === null || outcomeTestNames.some(t => selectedTests!.includes(t));
+(anyOutcomeSelected ? describeOutcome : describe.skip)('Planted-bug outcome evals', () => {
   let outcomeDir: string;
 
   beforeAll(() => {
@@ -767,7 +809,7 @@ CRITICAL RULES:
 
 // --- Plan CEO Review E2E ---
 
-describeE2E('Plan CEO Review E2E', () => {
+describeIfSelected('Plan CEO Review E2E', ['plan-ceo-review'], () => {
   let planDir: string;
 
   beforeAll(() => {
@@ -854,7 +896,7 @@ Focus on reviewing the plan content: architecture, error handling, security, and
 
 // --- Plan CEO Review (SELECTIVE EXPANSION) E2E ---
 
-describeE2E('Plan CEO Review SELECTIVE EXPANSION E2E', () => {
+describeIfSelected('Plan CEO Review SELECTIVE EXPANSION E2E', ['plan-ceo-review-selective'], () => {
   let planDir: string;
 
   beforeAll(() => {
@@ -937,7 +979,7 @@ Focus on reviewing the plan content: architecture, error handling, security, and
 
 // --- Plan Eng Review E2E ---
 
-describeE2E('Plan Eng Review E2E', () => {
+describeIfSelected('Plan Eng Review E2E', ['plan-eng-review'], () => {
   let planDir: string;
 
   beforeAll(() => {
@@ -1031,7 +1073,7 @@ Focus on architecture, code quality, tests, and performance sections.`,
 
 // --- Retro E2E ---
 
-describeE2E('Retro E2E', () => {
+describeIfSelected('Retro E2E', ['retro'], () => {
   let retroDir: string;
 
   beforeAll(() => {
@@ -1117,7 +1159,7 @@ Analyze the git history and produce the narrative report as described in the SKI
 
 // --- QA-Only E2E (report-only, no fixes) ---
 
-describeE2E('QA-Only skill E2E', () => {
+describeIfSelected('QA-Only skill E2E', ['qa-only-no-fix'], () => {
   let qaOnlyDir: string;
 
   beforeAll(() => {
@@ -1203,7 +1245,7 @@ Write your report to ${qaOnlyDir}/qa-reports/qa-only-report.md`,
 
 // --- QA Fix Loop E2E ---
 
-describeE2E('QA Fix Loop E2E', () => {
+describeIfSelected('QA Fix Loop E2E', ['qa-fix-loop'], () => {
   let qaFixDir: string;
   let qaFixServer: ReturnType<typeof Bun.serve> | null = null;
 
@@ -1317,7 +1359,7 @@ This is a test+fix loop: find bugs, fix them in the source code, commit each fix
 
 // --- Plan-Eng-Review Test-Plan Artifact E2E ---
 
-describeE2E('Plan-Eng-Review Test-Plan Artifact E2E', () => {
+describeIfSelected('Plan-Eng-Review Test-Plan Artifact E2E', ['plan-eng-review-artifact'], () => {
   let planDir: string;
   let projectDir: string;
 
@@ -1444,7 +1486,7 @@ Write your review to ${planDir}/review-output.md`,
 
 // --- Base branch detection smoke tests ---
 
-describeE2E('Base branch detection', () => {
+describeIfSelected('Base branch detection', ['review-base-branch', 'ship-base-branch', 'retro-base-branch'], () => {
   let baseBranchDir: string;
   const run = (cmd: string, args: string[], cwd: string) =>
     spawnSync(cmd, args, { cwd, stdio: 'pipe', timeout: 5000 });
@@ -1457,7 +1499,7 @@ describeE2E('Base branch detection', () => {
     try { fs.rmSync(baseBranchDir, { recursive: true, force: true }); } catch {}
   });
 
-  test('/review detects base branch and diffs against it', async () => {
+  testIfSelected('review-base-branch', async () => {
     const dir = path.join(baseBranchDir, 'review-base');
     fs.mkdirSync(dir, { recursive: true });
 
@@ -1510,7 +1552,7 @@ Write your findings to ${dir}/review-output.md`,
     expect(usedGitDiff).toBe(true);
   }, 120_000);
 
-  test('/ship Step 0-1 detects base branch without destructive actions', async () => {
+  testIfSelected('ship-base-branch', async () => {
     const dir = path.join(baseBranchDir, 'ship-base');
     fs.mkdirSync(dir, { recursive: true });
 
@@ -1572,7 +1614,7 @@ Write a summary of what you detected to ${dir}/ship-preflight.md including:
     expect(destructiveTools).toHaveLength(0);
   }, 90_000);
 
-  test('/retro detects default branch for git queries', async () => {
+  testIfSelected('retro-base-branch', async () => {
     const dir = path.join(baseBranchDir, 'retro-base');
     fs.mkdirSync(dir, { recursive: true });
 
@@ -1631,7 +1673,7 @@ Write your retrospective to ${dir}/retro-output.md`,
 
 // --- Document-Release skill E2E ---
 
-describeE2E('Document-Release skill E2E', () => {
+describeIfSelected('Document-Release skill E2E', ['document-release'], () => {
   let docReleaseDir: string;
 
   beforeAll(() => {
@@ -1735,6 +1777,7 @@ IMPORTANT:
 
 // --- Deferred skill E2E tests (destructive or require interactive UI) ---
 
+// Deferred tests — only test.todo entries, no selection needed
 describeE2E('Deferred skill E2E', () => {
   // Ship is destructive: pushes to remote, creates PRs, modifies VERSION/CHANGELOG
   test.todo('/ship completes full workflow');
@@ -1772,7 +1815,10 @@ ${designMd}
 Return JSON: { "passed": true/false, "reasoning": "one paragraph explaining your evaluation" }`);
 }
 
-describeE2E('Design Consultation E2E', () => {
+describeIfSelected('Design Consultation E2E', [
+  'design-consultation-core', 'design-consultation-research',
+  'design-consultation-existing', 'design-consultation-preview',
+], () => {
   let designDir: string;
 
   beforeAll(() => {
@@ -1816,7 +1862,7 @@ A civic tech data platform for government employees to access, visualize, and sh
     try { fs.rmSync(designDir, { recursive: true, force: true }); } catch {}
   });
 
-  test('Test 1: core flow produces valid DESIGN.md + CLAUDE.md', async () => {
+  testIfSelected('design-consultation-core', async () => {
     const result = await runSkillTest({
       prompt: `Read design-consultation/SKILL.md for the design consultation workflow.
 
@@ -1876,7 +1922,7 @@ Write DESIGN.md and CLAUDE.md (or update it) in the working directory.`,
     }
   }, 420_000);
 
-  test('Test 2: research integration uses WebSearch', async () => {
+  testIfSelected('design-consultation-research', async () => {
     // Clean up from previous test
     try { fs.unlinkSync(path.join(designDir, 'DESIGN.md')); } catch {}
     try { fs.unlinkSync(path.join(designDir, 'CLAUDE.md')); } catch {}
@@ -1933,7 +1979,7 @@ Write DESIGN.md to the working directory.`,
     expect(designExists).toBe(true);
   }, 420_000);
 
-  test('Test 3: handles existing DESIGN.md', async () => {
+  testIfSelected('design-consultation-existing', async () => {
     // Pre-create a minimal DESIGN.md
     fs.writeFileSync(path.join(designDir, 'DESIGN.md'), `# Design System — CivicPulse
 
@@ -1979,7 +2025,7 @@ Skip research. Skip font preview. Skip any AskUserQuestion calls — this is non
     }
   }, 420_000);
 
-  test('Test 4: generates font + color preview HTML', async () => {
+  testIfSelected('design-consultation-preview', async () => {
     // Clean up
     try { fs.unlinkSync(path.join(designDir, 'DESIGN.md')); } catch {}
 
@@ -2043,7 +2089,7 @@ Skip research. Skip any AskUserQuestion calls — this is non-interactive. Gener
 
 // --- Plan Design Review E2E ---
 
-describeE2E('Plan Design Review E2E', () => {
+describeIfSelected('Plan Design Review E2E', ['plan-design-review-audit', 'plan-design-review-export'], () => {
   let reviewDir: string;
 
   beforeAll(() => {
@@ -2074,7 +2120,7 @@ describeE2E('Plan Design Review E2E', () => {
     try { fs.rmSync(reviewDir, { recursive: true, force: true }); } catch {}
   });
 
-  test('Test 5: /plan-design-review produces audit report', async () => {
+  testIfSelected('plan-design-review-audit', async () => {
     const result = await runSkillTest({
       prompt: `IMPORTANT: The browse binary is already assigned below as B. Do NOT search for it or run the SKILL.md setup block — just use $B directly.
 
@@ -2082,9 +2128,11 @@ B="${browseBin}"
 
 Read plan-design-review/SKILL.md for the design review workflow.
 
-Review the site at ${testServer.url}. Use --quick mode (homepage + 2 pages). Skip any AskUserQuestion calls — this is non-interactive. Write your audit report to ./design-audit.md. Do not offer to create DESIGN.md.`,
+Review the site at ${testServer.url}. Use --quick mode (homepage + 2 pages). Skip any AskUserQuestion calls — this is non-interactive. Write your audit report to ./design-audit.md. Do not offer to create DESIGN.md.
+
+EFFICIENCY: Skip the preamble bash block. Combine multiple browse commands into single bash blocks (e.g. run all Phase 2 JS extractions in one block). Write the report as soon as you have enough data — do not over-explore.`,
       workingDirectory: reviewDir,
-      maxTurns: 20,
+      maxTurns: 30,
       timeout: 360_000,
       testName: 'plan-design-review-audit',
       runId,
@@ -2113,7 +2161,7 @@ Review the site at ${testServer.url}. Use --quick mode (homepage + 2 pages). Ski
     }
   }, 420_000);
 
-  test('Test 6: /plan-design-review exports DESIGN.md', async () => {
+  testIfSelected('plan-design-review-export', async () => {
     // Clean up previous test artifacts
     try { fs.unlinkSync(path.join(reviewDir, 'design-audit.md')); } catch {}
 
@@ -2161,7 +2209,7 @@ Review ${testServer.url} with --quick mode. Skip any AskUserQuestion calls — t
 
 // --- QA Design Review E2E ---
 
-describeE2E('QA Design Review E2E', () => {
+describeIfSelected('QA Design Review E2E', ['qa-design-review-fix'], () => {
   let qaDesignDir: string;
   let qaDesignServer: ReturnType<typeof Bun.serve> | null = null;
 
@@ -2300,7 +2348,7 @@ Review the site at ${serverUrl}. Use --quick mode. Skip any AskUserQuestion call
 
 // --- Test Bootstrap E2E ---
 
-describeE2E('Test Bootstrap E2E', () => {
+describeIfSelected('Test Bootstrap E2E', ['qa-bootstrap'], () => {
   let bootstrapDir: string;
   let bootstrapServer: ReturnType<typeof Bun.serve>;
 
@@ -2437,7 +2485,7 @@ This is a test+fix loop: find bugs, fix them, write regression tests, commit eac
 
 // --- Test Coverage Audit E2E ---
 
-describeE2E('Test Coverage Audit E2E', () => {
+describeIfSelected('Test Coverage Audit E2E', ['ship-coverage-audit'], () => {
   let coverageDir: string;
 
   beforeAll(() => {
diff --git a/test/skill-llm-eval.test.ts b/test/skill-llm-eval.test.ts
index ba635613..c3e1aef2 100644
--- a/test/skill-llm-eval.test.ts
+++ b/test/skill-llm-eval.test.ts
@@ -17,6 +17,7 @@ import * as path from 'path';
 import { callJudge, judge } from './helpers/llm-judge';
 import type { JudgeScore } from './helpers/llm-judge';
 import { EvalCollector } from './helpers/eval-store';
+import { selectTests, detectBaseBranch, getChangedFiles, LLM_JUDGE_TOUCHFILES, GLOBAL_TOUCHFILES } from './helpers/touchfiles';
 
 const ROOT = path.resolve(import.meta.dir, '..');
 // Run when EVALS=1 is set (requires ANTHROPIC_API_KEY in env)
@@ -26,8 +27,43 @@ const describeEval = evalsEnabled ? describe : describe.skip;
 // Eval result collector
 const evalCollector = evalsEnabled ? new EvalCollector('llm-judge') : null;
 
-describeEval('LLM-as-judge quality evals', () => {
-  test('command reference table scores >= 4 on all dimensions', async () => {
+// --- Diff-based test selection ---
+let selectedTests: string[] | null = null; // null = no filtering, run all
+
+if (evalsEnabled && !process.env.EVALS_ALL) {
+  const base = process.env.EVALS_BASE || detectBaseBranch(ROOT) || 'main';
+  const diffFiles = getChangedFiles(base, ROOT);
+
+  // An empty diff leaves selectedTests null, so every LLM-judge test runs.
+  if (diffFiles.length > 0) {
+    const { selected, skipped, reason } = selectTests(diffFiles, LLM_JUDGE_TOUCHFILES, GLOBAL_TOUCHFILES);
+    const total = Object.keys(LLM_JUDGE_TOUCHFILES).length;
+    selectedTests = selected;
+    process.stderr.write(`\nLLM-judge selection (${reason}): ${selected.length}/${total} tests\n`);
+    if (skipped.length > 0) {
+      process.stderr.write(`  Skipped: ${skipped.join(', ')}\n`);
+    }
+    process.stderr.write('\n');
+  }
+}
+
+/** Register a describe block via describeEval when nothing is filtered or any of its tests is selected; otherwise skip it. */
+function describeIfSelected(name: string, testNames: string[], fn: () => void) {
+  const chosen = selectedTests;
+  (chosen === null || testNames.some(t => chosen.includes(t)) ? describeEval : describe.skip)(name, fn);
+}
+
+/** Register one test, skipping it when a selection is active and does not include testName. */
+function testIfSelected(testName: string, fn: () => Promise<void>, timeout: number) {
+  const excluded = selectedTests !== null && !selectedTests.includes(testName);
+  (excluded ? test.skip : test)(testName, fn, timeout);
+}
+
+describeIfSelected('LLM-as-judge quality evals', [
+  'command reference table', 'snapshot flags reference',
+  'browse/SKILL.md reference', 'setup block', 'regression vs baseline',
+], () => {
+  testIfSelected('command reference table', async () => {
     const t0 = Date.now();
     const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     const start = content.indexOf('## Command Reference');
@@ -53,7 +89,7 @@ describeEval('LLM-as-judge quality evals', () => {
     expect(scores.actionability).toBeGreaterThanOrEqual(4);
   }, 30_000);
 
-  test('snapshot flags section scores >= 4 on all dimensions', async () => {
+  testIfSelected('snapshot flags reference', async () => {
     const t0 = Date.now();
     const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     const start = content.indexOf('## Snapshot System');
@@ -79,7 +115,7 @@ describeEval('LLM-as-judge quality evals', () => {
     expect(scores.actionability).toBeGreaterThanOrEqual(4);
   }, 30_000);
 
-  test('browse/SKILL.md overall scores >= 4', async () => {
+  testIfSelected('browse/SKILL.md reference', async () => {
     const t0 = Date.now();
     const content = fs.readFileSync(path.join(ROOT, 'browse', 'SKILL.md'), 'utf-8');
     const start = content.indexOf('## Snapshot Flags');
@@ -104,7 +140,7 @@ describeEval('LLM-as-judge quality evals', () => {
     expect(scores.actionability).toBeGreaterThanOrEqual(4);
   }, 30_000);
 
-  test('setup block scores >= 3 on actionability and clarity', async () => {
+  testIfSelected('setup block', async () => {
     const t0 = Date.now();
     const content = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     const setupStart = content.indexOf('## SETUP');
@@ -131,7 +167,7 @@ describeEval('LLM-as-judge quality evals', () => {
     expect(scores.clarity).toBeGreaterThanOrEqual(3);
   }, 30_000);
 
-  test('regression check: compare branch vs baseline quality', async () => {
+  testIfSelected('regression vs baseline', async () => {
     const t0 = Date.now();
     const generated = fs.readFileSync(path.join(ROOT, 'SKILL.md'), 'utf-8');
     const genStart = generated.indexOf('## Command Reference');
@@ -220,10 +256,10 @@ Scores are 1-5 overall quality.`,
 
 // --- Part 7: QA skill quality evals (C6) ---
 
-describeEval('QA skill quality evals', () => {
+describeIfSelected('QA skill quality evals', ['qa/SKILL.md workflow', 'qa/SKILL.md health rubric'], () => {
   const qaContent = fs.readFileSync(path.join(ROOT, 'qa', 'SKILL.md'), 'utf-8');
 
-  test('qa/SKILL.md workflow quality scores >= 4', async () => {
+  testIfSelected('qa/SKILL.md workflow', async () => {
     const t0 = Date.now();
     const start = qaContent.indexOf('## Workflow');
     const end = qaContent.indexOf('## Health Score Rubric');
@@ -266,7 +302,7 @@ ${section}`);
     expect(scores.actionability).toBeGreaterThanOrEqual(4);
   }, 30_000);
 
-  test('qa/SKILL.md health score rubric is unambiguous', async () => {
+  testIfSelected('qa/SKILL.md health rubric', async () => {
     const t0 = Date.now();
     const start = qaContent.indexOf('## Health Score Rubric');
     const section = qaContent.slice(start);
@@ -310,8 +346,8 @@ ${section}`);
 
 // --- Part 7: Cross-skill consistency judge (C7) ---
 
-describeEval('Cross-skill consistency evals', () => {
-  test('greptile-history patterns are consistent across all skills', async () => {
+describeIfSelected('Cross-skill consistency evals', ['cross-skill greptile consistency'], () => {
+  testIfSelected('cross-skill greptile consistency', async () => {
     const t0 = Date.now();
     const reviewContent = fs.readFileSync(path.join(ROOT, 'review', 'SKILL.md'), 'utf-8');
     const shipContent = fs.readFileSync(path.join(ROOT, 'ship', 'SKILL.md'), 'utf-8');
@@ -375,10 +411,10 @@ score (1-5): 5 = perfectly consistent, 1 = contradictory`);
 
 // --- Part 7: Baseline score pinning (C9) ---
 
-describeEval('Baseline score pinning', () => {
+describeIfSelected('Baseline score pinning', ['baseline score pinning'], () => {
   const baselinesPath = path.join(ROOT, 'test', 'fixtures', 'eval-baselines.json');
 
-  test('LLM eval scores do not regress below baselines', async () => {
+  testIfSelected('baseline score pinning', async () => {
     const t0 = Date.now();
     if (!fs.existsSync(baselinesPath)) {
       console.log('No baseline file found — skipping pinning check');
diff --git a/test/touchfiles.test.ts b/test/touchfiles.test.ts
new file mode 100644
index 00000000..e666bb3d
--- /dev/null
+++ b/test/touchfiles.test.ts
@@ -0,0 +1,253 @@
+/**
+ * Unit tests for diff-based test selection.
+ * Free (no API calls), runs with `bun test`.
+ */
+
+import { describe, test, expect } from 'bun:test';
+import { spawnSync } from 'child_process';
+import * as fs from 'fs';
+import * as path from 'path';
+import * as os from 'os';
+import {
+  matchGlob,
+  selectTests,
+  detectBaseBranch,
+  E2E_TOUCHFILES,
+  LLM_JUDGE_TOUCHFILES,
+  GLOBAL_TOUCHFILES,
+} from './helpers/touchfiles';
+
+const ROOT = path.resolve(import.meta.dir, '..');
+
+// --- matchGlob ---
+
+describe('matchGlob', () => {
+  test('** matches any depth of path segments', () => {
+    for (const file of ['browse/src/commands.ts', 'browse/src/deep/nested/file.ts', 'browse/src/cli.ts']) {
+      expect(matchGlob(file, 'browse/src/**')).toBe(true);
+    }
+  });
+
+  test('** does not match unrelated paths', () => {
+    const verdicts = ['browse/src/commands.ts', 'review/SKILL.md'].map(file => matchGlob(file, 'qa/**'));
+    expect(verdicts).toEqual([false, false]);
+  });
+
+  test('exact match works', () => {
+    // Only the identical path matches: neither a longer filename nor a nested copy does.
+    const verdicts = ['SKILL.md', 'SKILL.md.tmpl', 'qa/SKILL.md'].map(file => matchGlob(file, 'SKILL.md'));
+    expect(verdicts).toEqual([true, false, false]);
+  });
+
+  test('* matches within a single segment', () => {
+    const files = ['test/fixtures/review-eval-enum.rb', 'test/fixtures/review-eval-enum-diff.rb', 'test/fixtures/review-eval-vuln.rb'];
+    const verdicts = files.map(file => matchGlob(file, 'test/fixtures/review-eval-enum*.rb'));
+    expect(verdicts).toEqual([true, true, false]);
+  });
+
+  test('dots in patterns are escaped correctly', () => {
+    // The '.' in the pattern must match a literal dot only, so 'SKILLxmd' is rejected.
+    expect(['SKILL.md', 'SKILLxmd'].map(file => matchGlob(file, 'SKILL.md'))).toEqual([true, false]);
+  });
+
+  test('** at end matches files in the directory', () => {
+    for (const file of ['qa/SKILL.md', 'qa/SKILL.md.tmpl', 'qa/templates/report.md']) {
+      expect(matchGlob(file, 'qa/**')).toBe(true);
+    }
+  });
+});
+
+// --- selectTests ---
+
+describe('selectTests', () => { // exercises selectTests(changedFiles, touchfiles) against the imported touchfile tables
+  test('browse/src change selects browse and qa tests', () => {
+    const result = selectTests(['browse/src/commands.ts'], E2E_TOUCHFILES);
+    expect(result.selected).toContain('browse-basic');
+    expect(result.selected).toContain('browse-snapshot');
+    expect(result.selected).toContain('qa-quick');
+    expect(result.selected).toContain('qa-fix-loop');
+    expect(result.selected).toContain('qa-design-review-fix');
+    expect(result.reason).toBe('diff');
+    // Tests for skills unrelated to browse/src must stay out of the selection
+    expect(result.selected).not.toContain('plan-ceo-review');
+    expect(result.selected).not.toContain('retro');
+    expect(result.selected).not.toContain('document-release');
+  });
+
+  test('skill-specific change selects only that skill and related tests', () => {
+    const result = selectTests(['plan-ceo-review/SKILL.md'], E2E_TOUCHFILES);
+    expect(result.selected).toContain('plan-ceo-review');
+    expect(result.selected).toContain('plan-ceo-review-selective');
+    expect(result.selected.length).toBe(2);
+    expect(result.skipped.length).toBe(Object.keys(E2E_TOUCHFILES).length - 2); // selected + skipped covers every entry
+  });
+
+  test('global touchfile triggers ALL tests', () => {
+    const result = selectTests(['test/helpers/session-runner.ts'], E2E_TOUCHFILES); // NOTE(review): no third argument — presumably selectTests defaults it to GLOBAL_TOUCHFILES; confirm in helpers/touchfiles
+    expect(result.selected.length).toBe(Object.keys(E2E_TOUCHFILES).length);
+    expect(result.skipped.length).toBe(0);
+    expect(result.reason).toContain('global');
+  });
+
+  test('gen-skill-docs.ts is a global touchfile', () => {
+    const result = selectTests(['scripts/gen-skill-docs.ts'], E2E_TOUCHFILES);
+    expect(result.selected.length).toBe(Object.keys(E2E_TOUCHFILES).length);
+    expect(result.reason).toContain('global');
+  });
+
+  test('unrelated file selects nothing', () => {
+    const result = selectTests(['README.md'], E2E_TOUCHFILES);
+    expect(result.selected).toEqual([]);
+    expect(result.skipped.length).toBe(Object.keys(E2E_TOUCHFILES).length);
+  });
+
+  test('empty changed files selects nothing', () => {
+    const result = selectTests([], E2E_TOUCHFILES);
+    expect(result.selected).toEqual([]);
+  });
+
+  test('multiple changed files union their selections', () => {
+    const result = selectTests(
+      ['plan-ceo-review/SKILL.md', 'retro/SKILL.md.tmpl'],
+      E2E_TOUCHFILES,
+    );
+    expect(result.selected).toContain('plan-ceo-review');
+    expect(result.selected).toContain('plan-ceo-review-selective');
+    expect(result.selected).toContain('retro');
+    expect(result.selected).toContain('retro-base-branch');
+    expect(result.selected.length).toBe(4);
+  });
+
+  test('works with LLM_JUDGE_TOUCHFILES', () => {
+    const result = selectTests(['qa/SKILL.md'], LLM_JUDGE_TOUCHFILES);
+    expect(result.selected).toContain('qa/SKILL.md workflow');
+    expect(result.selected).toContain('qa/SKILL.md health rubric');
+    expect(result.selected.length).toBe(2);
+  });
+
+  test('SKILL.md.tmpl root template only selects root-dependent tests', () => {
+    const result = selectTests(['SKILL.md.tmpl'], E2E_TOUCHFILES);
+    // Should select the tests that depend on root SKILL.md (said to be 7; only three are spot-checked here — TODO confirm the count)
+    expect(result.selected).toContain('skillmd-setup-discovery');
+    expect(result.selected).toContain('contributor-mode');
+    expect(result.selected).toContain('session-awareness');
+    // Tests for other skills must not be pulled in by the root template
+    expect(result.selected).not.toContain('plan-ceo-review');
+    expect(result.selected).not.toContain('retro');
+  });
+
+  test('global touchfiles work for LLM-judge tests too', () => {
+    const result = selectTests(['scripts/gen-skill-docs.ts'], LLM_JUDGE_TOUCHFILES);
+    expect(result.selected.length).toBe(Object.keys(LLM_JUDGE_TOUCHFILES).length);
+  });
+});
+
+// --- detectBaseBranch ---
+// Each test works in a throwaway temp directory that is removed in `finally`.
+describe('detectBaseBranch', () => {
+  test('detects local main branch', () => {
+    const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'touchfiles-test-'));
+    const git = (...args: string[]) =>
+      spawnSync('git', args, { cwd: dir, stdio: 'pipe', timeout: 5000 });
+    try {
+      // Pin the initial branch so a developer's own init.defaultBranch cannot rename it.
+      git('-c', 'init.defaultBranch=main', 'init');
+      git('config', 'user.email', 'test@test.com');
+      git('config', 'user.name', 'Test');
+      fs.writeFileSync(path.join(dir, 'test.txt'), 'hello\n');
+      git('add', '.');
+      git('commit', '-m', 'init');
+      // 'master' is still accepted for git versions that predate init.defaultBranch.
+      expect(detectBaseBranch(dir)).toMatch(/^(main|master)$/);
+    } finally {
+      try { fs.rmSync(dir, { recursive: true, force: true }); } catch {}
+    }
+  });
+
+  test('returns null for empty repo with no branches', () => {
+    const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'touchfiles-test-'));
+    try {
+      // `git init` alone creates no commits, so no branch exists yet.
+      spawnSync('git', ['init'], { cwd: dir, stdio: 'pipe', timeout: 5000 });
+      expect(detectBaseBranch(dir)).toBeNull();
+    } finally {
+      // Best-effort cleanup; runs even when the assertion above fails.
+      try { fs.rmSync(dir, { recursive: true, force: true }); } catch {}
+    }
+  });
+
+  test('returns null for non-git directory', () => {
+    const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'touchfiles-test-'));
+    try {
+      expect(detectBaseBranch(dir)).toBeNull();
+    } finally {
+      try { fs.rmSync(dir, { recursive: true, force: true }); } catch {}
+    }
+  });
+});
+
+// --- Completeness: every testName in skill-e2e.test.ts has a TOUCHFILES entry ---
+
+describe('TOUCHFILES completeness', () => {
+  /**
+   * Capture group 1 of every match of `pattern` in `text`.
+   * `pattern` must carry the g flag (String.prototype.matchAll requires it).
+   */
+  const captures = (text: string, pattern: RegExp): string[] =>
+    Array.from(text.matchAll(pattern), hit => hit[1]);
+
+  test('every E2E testName has a TOUCHFILES entry', () => {
+    const e2eSource = fs.readFileSync(
+      path.join(ROOT, 'test', 'skill-e2e.test.ts'),
+      'utf-8',
+    );
+
+    // Literal `testName: '...'` values. A name that still contains an
+    // interpolation (like `qa-${label}`) is dropped here; its expanded forms
+    // (qa-b6-static, qa-b7-spa, qa-b8-checkout) are collected just below.
+    const literalNames = captures(e2eSource, /testName:\s*['"`]([^'"`]+)['"`]/g)
+      .filter(name => !name.includes('${'));
+
+    // Expanded names: the quoted last argument of each runPlantedBugEval(...)
+    // call, prefixed with "qa-".
+    const plantedNames = captures(
+      e2eSource,
+      /runPlantedBugEval\([^,]+,\s*[^,]+,\s*['"`]([^'"`]+)['"`]\)/g,
+    ).map(label => `qa-${label}`);
+
+    const testNames = [...literalNames, ...plantedNames];
+    expect(testNames.length).toBeGreaterThan(0);
+
+    // Every collected name must be a key of E2E_TOUCHFILES.
+    const missing = testNames.filter(name => !(name in E2E_TOUCHFILES));
+    if (missing.length === 0) return;
+
+    throw new Error(
+      `E2E tests missing TOUCHFILES entries: ${missing.join(', ')}\n` +
+      `Add these to E2E_TOUCHFILES in test/helpers/touchfiles.ts`,
+    );
+  });
+
+  test('every LLM-judge test has a TOUCHFILES entry', () => {
+    const llmSource = fs.readFileSync(
+      path.join(ROOT, 'test', 'skill-llm-eval.test.ts'),
+      'utf-8',
+    );
+
+    // Test names are the `name: '...'` values (addTest({ name: '...' }) calls).
+    // Some tests call addTest with the same name, so duplicates are removed
+    // with a Set.
+    const unique = [
+      ...new Set(captures(llmSource, /name:\s*['"`]([^'"`]+)['"`]/g)),
+    ];
+    expect(unique.length).toBeGreaterThan(0);
+
+    const missing = unique.filter(name => !(name in LLM_JUDGE_TOUCHFILES));
+    if (missing.length === 0) return;
+
+    throw new Error(
+      `LLM-judge tests missing TOUCHFILES entries: ${missing.join(', ')}\n` +
+      `Add these to LLM_JUDGE_TOUCHFILES in test/helpers/touchfiles.ts`,
+    );
+  });
+});

From d8894b750fb39cd1ed2932af42c17aaa850d5c4c Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 19:09:04 -0500
Subject: [PATCH 19/22] feat: cognitive patterns for plan-review skills
 (v0.6.2) (#141)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* feat: cognitive patterns for plan-review skills — latent space activation

Enrich /plan-ceo-review, /plan-eng-review, and /plan-design-review with
researched cognitive patterns from Bezos, Grove, Munger, Horowitz, Altman,
Rams, Norman, Zhuo, Gebbia, Larson, McKinley, Brooks, Beck, and Majors.
Patterns are evocative activation keys, not checklists — they trigger the
LLM's deep knowledge of how these people actually think.

* chore: bump version and changelog (v0.6.2.0)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                     |  7 +++++++
 VERSION                          |  2 +-
 plan-ceo-review/SKILL.md         | 21 +++++++++++++++++++++
 plan-ceo-review/SKILL.md.tmpl    | 21 +++++++++++++++++++++
 plan-design-review/SKILL.md      | 21 +++++++++++++++++++++
 plan-design-review/SKILL.md.tmpl | 21 +++++++++++++++++++++
 plan-eng-review/SKILL.md         | 22 ++++++++++++++++++++++
 plan-eng-review/SKILL.md.tmpl    | 22 ++++++++++++++++++++++
 8 files changed, 136 insertions(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5062711c..5df40ae8 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,12 @@
 # Changelog
 
+## [0.6.2.0] - 2026-03-17
+
+### Added
+
+- **Plan reviews now think like the best in the world.** `/plan-ceo-review` applies 14 cognitive patterns from Bezos (one-way doors, Day 1 proxy skepticism), Grove (paranoid scanning), Munger (inversion), Horowitz (wartime awareness), Chesky/Graham (founder mode), and Altman (leverage obsession). `/plan-eng-review` applies 15 patterns from Larson (team state diagnosis), McKinley (boring by default), Brooks (essential vs accidental complexity), Beck (make the change easy), Majors (own your code in production), and Google SRE (error budgets). `/plan-design-review` applies 12 patterns from Rams (subtraction default), Norman (time-horizon design), Zhuo (principled taste), Gebbia (design for trust, storyboard the journey), and Ive (care is visible).
+- **Latent space activation, not checklists.** The cognitive patterns name-drop frameworks and people so the LLM draws on its deep knowledge of how they actually think. The instruction is "internalize these, don't enumerate them" — making each review a genuine perspective shift, not a longer checklist.
+
 ## [0.6.1.0] - 2026-03-17
 
 ### Added
diff --git a/VERSION b/VERSION
index 44e7f9a2..e1e48733 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.6.1.0
+0.6.2.0
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index d7953a92..b44dff6d 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -176,6 +176,27 @@ Do NOT make any code changes. Do NOT start implementation. Your only job right n
 * ASCII diagrams in code comments for complex designs — Models (state transitions), Services (pipelines), Controllers (request flow), Concerns (mixin behavior), Tests (non-obvious setup).
 * Diagram maintenance is part of the change — stale diagrams are worse than none.
 
+## Cognitive Patterns — How Great CEOs Think
+
+These are not checklist items. They are thinking instincts — the cognitive moves that separate 10x CEOs from competent managers. Let them shape your perspective throughout the review. Don't enumerate them; internalize them.
+
+1. **Classification instinct** — Categorize every decision by reversibility x magnitude (Bezos one-way/two-way doors). Most things are two-way doors; move fast.
+2. **Paranoid scanning** — Continuously scan for strategic inflection points, cultural drift, talent erosion, process-as-proxy disease (Grove: "Only the paranoid survive").
+3. **Inversion reflex** — For every "how do we win?" also ask "what would make us fail?" (Munger).
+4. **Focus as subtraction** — Primary value-add is what to *not* do. Jobs went from 350 products to 10. Default: do fewer things, better.
+5. **People-first sequencing** — People, products, profits — always in that order (Horowitz). Talent density solves most other problems (Hastings).
+6. **Speed calibration** — Fast is default. Only slow down for irreversible + high-magnitude decisions. 70% information is enough to decide (Bezos).
+7. **Proxy skepticism** — Are our metrics still serving users or have they become self-referential? (Bezos Day 1).
+8. **Narrative coherence** — Hard decisions need clear framing. Make the "why" legible, not everyone happy.
+9. **Temporal depth** — Think in 5-10 year arcs. Apply regret minimization for major bets (Bezos at age 80).
+10. **Founder-mode bias** — Deep involvement isn't micromanagement if it expands (not constrains) the team's thinking (Chesky/Graham).
+11. **Wartime awareness** — Correctly diagnose peacetime vs wartime. Peacetime habits kill wartime companies (Horowitz).
+12. **Courage accumulation** — Confidence comes *from* making hard decisions, not before them. "The struggle IS the job."
+13. **Willfulness as strategy** — Be intentionally willful. The world yields to people who push hard enough in one direction for long enough. Most people give up too early (Altman).
+14. **Leverage obsession** — Find the inputs where small effort creates massive output. Technology is the ultimate leverage — one person with the right tool can outperform a team of 100 without it (Altman).
+
+When you evaluate architecture, think through the inversion reflex. When you challenge scope, apply focus as subtraction. When you assess timeline, use speed calibration. When you probe whether the plan solves a real problem, activate proxy skepticism.
+
 ## Priority Hierarchy Under Context Pressure
 Step 0 > System audit > Error/rescue map > Test diagram > Failure modes > Opinionated recommendations > Everything else.
 Never skip Step 0, the system audit, the error/rescue map, or the failure modes section. These are the highest-leverage outputs.
diff --git a/plan-ceo-review/SKILL.md.tmpl b/plan-ceo-review/SKILL.md.tmpl
index 8695dd8b..0616a4cc 100644
--- a/plan-ceo-review/SKILL.md.tmpl
+++ b/plan-ceo-review/SKILL.md.tmpl
@@ -55,6 +55,27 @@ Do NOT make any code changes. Do NOT start implementation. Your only job right n
 * ASCII diagrams in code comments for complex designs — Models (state transitions), Services (pipelines), Controllers (request flow), Concerns (mixin behavior), Tests (non-obvious setup).
 * Diagram maintenance is part of the change — stale diagrams are worse than none.
 
+## Cognitive Patterns — How Great CEOs Think
+
+These are not checklist items. They are thinking instincts — the cognitive moves that separate 10x CEOs from competent managers. Let them shape your perspective throughout the review. Don't enumerate them; internalize them.
+
+1. **Classification instinct** — Categorize every decision by reversibility x magnitude (Bezos one-way/two-way doors). Most things are two-way doors; move fast.
+2. **Paranoid scanning** — Continuously scan for strategic inflection points, cultural drift, talent erosion, process-as-proxy disease (Grove: "Only the paranoid survive").
+3. **Inversion reflex** — For every "how do we win?" also ask "what would make us fail?" (Munger).
+4. **Focus as subtraction** — Primary value-add is what to *not* do. Jobs went from 350 products to 10. Default: do fewer things, better.
+5. **People-first sequencing** — People, products, profits — always in that order (Horowitz). Talent density solves most other problems (Hastings).
+6. **Speed calibration** — Fast is default. Only slow down for irreversible + high-magnitude decisions. 70% information is enough to decide (Bezos).
+7. **Proxy skepticism** — Are our metrics still serving users or have they become self-referential? (Bezos Day 1).
+8. **Narrative coherence** — Hard decisions need clear framing. Make the "why" legible, not everyone happy.
+9. **Temporal depth** — Think in 5-10 year arcs. Apply regret minimization for major bets (Bezos at age 80).
+10. **Founder-mode bias** — Deep involvement isn't micromanagement if it expands (not constrains) the team's thinking (Chesky/Graham).
+11. **Wartime awareness** — Correctly diagnose peacetime vs wartime. Peacetime habits kill wartime companies (Horowitz).
+12. **Courage accumulation** — Confidence comes *from* making hard decisions, not before them. "The struggle IS the job."
+13. **Willfulness as strategy** — Be intentionally willful. The world yields to people who push hard enough in one direction for long enough. Most people give up too early (Altman).
+14. **Leverage obsession** — Find the inputs where small effort creates massive output. Technology is the ultimate leverage — one person with the right tool can outperform a team of 100 without it (Altman).
+
+When you evaluate architecture, think through the inversion reflex. When you challenge scope, apply focus as subtraction. When you assess timeline, use speed calibration. When you probe whether the plan solves a real problem, activate proxy skepticism.
+
 ## Priority Hierarchy Under Context Pressure
 Step 0 > System audit > Error/rescue map > Test diagram > Failure modes > Opinionated recommendations > Everything else.
 Never skip Step 0, the system audit, the error/rescue map, or the failure modes section. These are the highest-leverage outputs.
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index f0b2fddd..a8f3498e 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -125,6 +125,27 @@ Slug: lowercase, hyphens, max 60 chars (e.g. `browse-js-no-await`). Skip if file
 
 You are a senior product designer reviewing a live site. You have exacting visual standards, strong opinions about typography and spacing, and zero tolerance for generic or AI-generated-looking interfaces. You do NOT care whether things "work." You care whether they feel right, look intentional, and respect the user.
 
+## Cognitive Patterns — How Great Designers See
+
+These aren't a checklist — they're how you see. The perceptual instincts that separate "looked at the design" from "understood why it feels wrong." Let them run automatically as you audit.
+
+1. **Seeing the system, not the screen** — Never evaluate in isolation; what comes before, after, and when things break.
+2. **Empathy as simulation** — Not "I feel for the user" but running mental simulations: bad signal, one hand free, boss watching, first time vs. 1000th time.
+3. **Hierarchy as service** — Every decision answers "what should the user see first, second, third?" Respecting their time, not prettifying pixels.
+4. **Constraint worship** — Limitations force clarity. "If I can only show 3 things, which 3 matter most?"
+5. **The question reflex** — First instinct is questions, not opinions. "Who is this for? What did they try before this?"
+6. **Edge case paranoia** — What if the name is 47 chars? Zero results? Network fails? Colorblind? RTL language?
+7. **The "Would I notice?" test** — Invisible = perfect. The highest compliment is not noticing the design.
+8. **Principled taste** — "This feels wrong" is traceable to a broken principle. Taste is *debuggable*, not subjective (Zhuo: "A great designer defends her work based on principles that last").
+9. **Subtraction default** — "As little design as possible" (Rams). "Subtract the obvious, add the meaningful" (Maeda).
+10. **Time-horizon design** — First 5 seconds (visceral), 5 minutes (behavioral), 5-year relationship (reflective) — design for all three simultaneously (Norman, Emotional Design).
+11. **Design for trust** — Every design decision either builds or erodes trust. Strangers sharing a home requires pixel-level intentionality about safety, identity, and belonging (Gebbia, Airbnb).
+12. **Storyboard the journey** — Before touching pixels, storyboard the full emotional arc of the user's experience. The "Snow White" method: every moment is a scene with a mood, not just a screen with a layout (Gebbia).
+
+Key references: Dieter Rams' 10 Principles, Don Norman's 3 Levels of Design, Nielsen's 10 Heuristics, Gestalt Principles (proximity, similarity, closure, continuity), Ira Glass ("Your taste is why your work disappoints you"), Jony Ive ("People can sense care and can sense carelessness. Different and new is relatively easy. Doing something that's genuinely better is very hard."), Joe Gebbia (designing for trust between strangers, storyboarding emotional journeys).
+
+When auditing a page, empathy as simulation runs automatically. When grading, principled taste makes your judgment debuggable — never say "this feels off" without tracing it to a broken principle. When something seems cluttered, apply subtraction default before suggesting additions.
+
 ## Setup
 
 **Parse the user's request for these parameters:**
diff --git a/plan-design-review/SKILL.md.tmpl b/plan-design-review/SKILL.md.tmpl
index 97546805..f8ecb25a 100644
--- a/plan-design-review/SKILL.md.tmpl
+++ b/plan-design-review/SKILL.md.tmpl
@@ -21,6 +21,27 @@ allowed-tools:
 
 You are a senior product designer reviewing a live site. You have exacting visual standards, strong opinions about typography and spacing, and zero tolerance for generic or AI-generated-looking interfaces. You do NOT care whether things "work." You care whether they feel right, look intentional, and respect the user.
 
+## Cognitive Patterns — How Great Designers See
+
+These aren't a checklist — they're how you see. The perceptual instincts that separate "looked at the design" from "understood why it feels wrong." Let them run automatically as you audit.
+
+1. **Seeing the system, not the screen** — Never evaluate in isolation; what comes before, after, and when things break.
+2. **Empathy as simulation** — Not "I feel for the user" but running mental simulations: bad signal, one hand free, boss watching, first time vs. 1000th time.
+3. **Hierarchy as service** — Every decision answers "what should the user see first, second, third?" Respecting their time, not prettifying pixels.
+4. **Constraint worship** — Limitations force clarity. "If I can only show 3 things, which 3 matter most?"
+5. **The question reflex** — First instinct is questions, not opinions. "Who is this for? What did they try before this?"
+6. **Edge case paranoia** — What if the name is 47 chars? Zero results? Network fails? Colorblind? RTL language?
+7. **The "Would I notice?" test** — Invisible = perfect. The highest compliment is not noticing the design.
+8. **Principled taste** — "This feels wrong" is traceable to a broken principle. Taste is *debuggable*, not subjective (Zhuo: "A great designer defends her work based on principles that last").
+9. **Subtraction default** — "As little design as possible" (Rams). "Subtract the obvious, add the meaningful" (Maeda).
+10. **Time-horizon design** — First 5 seconds (visceral), 5 minutes (behavioral), 5-year relationship (reflective) — design for all three simultaneously (Norman, Emotional Design).
+11. **Design for trust** — Every design decision either builds or erodes trust. Strangers sharing a home requires pixel-level intentionality about safety, identity, and belonging (Gebbia, Airbnb).
+12. **Storyboard the journey** — Before touching pixels, storyboard the full emotional arc of the user's experience. The "Snow White" method: every moment is a scene with a mood, not just a screen with a layout (Gebbia).
+
+Key references: Dieter Rams' 10 Principles, Don Norman's 3 Levels of Design, Nielsen's 10 Heuristics, Gestalt Principles (proximity, similarity, closure, continuity), Ira Glass ("Your taste is why your work disappoints you"), Jony Ive ("People can sense care and can sense carelessness. Different and new is relatively easy. Doing something that's genuinely better is very hard."), Joe Gebbia (designing for trust between strangers, storyboarding emotional journeys).
+
+When auditing a page, empathy as simulation runs automatically. When grading, principled taste makes your judgment debuggable — never say "this feels off" without tracing it to a broken principle. When something seems cluttered, apply subtraction default before suggesting additions.
+
 ## Setup
 
 **Parse the user's request for these parameters:**
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index d2292af6..05c74ba7 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -135,6 +135,28 @@ If you are running low on context or the user asks you to compress: Step 0 > Tes
 * Bias toward explicit over clever.
 * Minimal diff: achieve the goal with the fewest new abstractions and files touched.
 
+## Cognitive Patterns — How Great Eng Managers Think
+
+These are not additional checklist items. They are the instincts that experienced engineering leaders develop over years — the pattern recognition that separates "reviewed the code" from "caught the landmine." Apply them throughout your review.
+
+1. **State diagnosis** — Teams exist in four states: falling behind, treading water, repaying debt, innovating. Each demands a different intervention (Larson, An Elegant Puzzle).
+2. **Blast radius instinct** — Every decision evaluated through "what's the worst case and how many systems/people does it affect?"
+3. **Boring by default** — "Every company gets about three innovation tokens." Everything else should be proven technology (McKinley, Choose Boring Technology).
+4. **Incremental over revolutionary** — Strangler fig, not big bang. Canary, not global rollout. Refactor, not rewrite (Fowler).
+5. **Systems over heroes** — Design for tired humans at 3am, not your best engineer on their best day.
+6. **Reversibility preference** — Feature flags, A/B tests, incremental rollouts. Make the cost of being wrong low.
+7. **Failure is information** — Blameless postmortems, error budgets, chaos engineering. Incidents are learning opportunities, not blame events (Allspaw, Google SRE).
+8. **Org structure IS architecture** — Conway's Law in practice. Design both intentionally (Skelton/Pais, Team Topologies).
+9. **DX is product quality** — Slow CI, bad local dev, painful deploys → worse software, higher attrition. Developer experience is a leading indicator.
+10. **Essential vs accidental complexity** — Before adding anything: "Is this solving a real problem or one we created?" (Brooks, No Silver Bullet).
+11. **Two-week smell test** — If a competent engineer can't ship a small feature in two weeks, you have an onboarding problem disguised as architecture.
+12. **Glue work awareness** — Recognize invisible coordination work. Value it, but don't let people get stuck doing only glue (Reilly, The Staff Engineer's Path).
+13. **Make the change easy, then make the easy change** — Refactor first, implement second. Never structural + behavioral changes simultaneously (Beck).
+14. **Own your code in production** — No wall between dev and ops. "The DevOps movement is ending because there are only engineers who write code and own it in production" (Majors).
+15. **Error budgets over uptime targets** — SLO of 99.9% = 0.1% downtime *budget to spend on shipping*. Reliability is resource allocation (Google SRE).
+
+When evaluating architecture, think "boring by default." When reviewing tests, think "systems over heroes." When assessing complexity, ask Brooks's question. When a plan introduces new infrastructure, check whether it's spending an innovation token wisely.
+
 ## Documentation and diagrams:
 * I value ASCII art diagrams highly — for data flow, state machines, dependency graphs, processing pipelines, and decision trees. Use them liberally in plans and design docs.
 * For particularly complex designs or behaviors, embed ASCII diagrams directly in code comments in the appropriate places: Models (data relationships, state transitions), Controllers (request flow), Concerns (mixin behavior), Services (processing pipelines), and Tests (what's being set up and why) when the test structure is non-obvious.
diff --git a/plan-eng-review/SKILL.md.tmpl b/plan-eng-review/SKILL.md.tmpl
index bf033606..91f24719 100644
--- a/plan-eng-review/SKILL.md.tmpl
+++ b/plan-eng-review/SKILL.md.tmpl
@@ -31,6 +31,28 @@ If you are running low on context or the user asks you to compress: Step 0 > Tes
 * Bias toward explicit over clever.
 * Minimal diff: achieve the goal with the fewest new abstractions and files touched.
 
+## Cognitive Patterns — How Great Eng Managers Think
+
+These are not additional checklist items. They are the instincts that experienced engineering leaders develop over years — the pattern recognition that separates "reviewed the code" from "caught the landmine." Apply them throughout your review.
+
+1. **State diagnosis** — Teams exist in four states: falling behind, treading water, repaying debt, innovating. Each demands a different intervention (Larson, An Elegant Puzzle).
+2. **Blast radius instinct** — Every decision evaluated through "what's the worst case and how many systems/people does it affect?"
+3. **Boring by default** — "Every company gets about three innovation tokens." Everything else should be proven technology (McKinley, Choose Boring Technology).
+4. **Incremental over revolutionary** — Strangler fig, not big bang. Canary, not global rollout. Refactor, not rewrite (Fowler).
+5. **Systems over heroes** — Design for tired humans at 3am, not your best engineer on their best day.
+6. **Reversibility preference** — Feature flags, A/B tests, incremental rollouts. Make the cost of being wrong low.
+7. **Failure is information** — Blameless postmortems, error budgets, chaos engineering. Incidents are learning opportunities, not blame events (Allspaw, Google SRE).
+8. **Org structure IS architecture** — Conway's Law in practice. Design both intentionally (Skelton/Pais, Team Topologies).
+9. **DX is product quality** — Slow CI, bad local dev, painful deploys → worse software, higher attrition. Developer experience is a leading indicator.
+10. **Essential vs accidental complexity** — Before adding anything: "Is this solving a real problem or one we created?" (Brooks, No Silver Bullet).
+11. **Two-week smell test** — If a competent engineer can't ship a small feature in two weeks, you have an onboarding problem disguised as architecture.
+12. **Glue work awareness** — Recognize invisible coordination work. Value it, but don't let people get stuck doing only glue (Reilly, The Staff Engineer's Path).
+13. **Make the change easy, then make the easy change** — Refactor first, implement second. Never structural + behavioral changes simultaneously (Beck).
+14. **Own your code in production** — No wall between dev and ops. "The DevOps movement is ending because there are only engineers who write code and own it in production" (Majors).
+15. **Error budgets over uptime targets** — SLO of 99.9% = 0.1% downtime *budget to spend on shipping*. Reliability is resource allocation (Google SRE).
+
+When evaluating architecture, think "boring by default." When reviewing tests, think "systems over heroes." When assessing complexity, ask Brooks's question. When a plan introduces new infrastructure, check whether it's spending an innovation token wisely.
+
 ## Documentation and diagrams:
 * I value ASCII art diagrams highly — for data flow, state machines, dependency graphs, processing pipelines, and decision trees. Use them liberally in plans and design docs.
 * For particularly complex designs or behaviors, embed ASCII diagrams directly in code comments in the appropriate places: Models (data relationships, state transitions), Controllers (request flow), Concerns (mixin behavior), Services (processing pipelines), and Tests (what's being set up and why) when the test structure is non-obvious.

From 28becb3b395c76f163d368aa20cfadc7cb686988 Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 20:12:55 -0500
Subject: [PATCH 20/22] feat: design review lite in /review and /ship +
 gstack-diff-scope (v0.6.3) (#142)

* feat: gstack-diff-scope helper + design review checklist

bin/gstack-diff-scope categorizes branch changes into SCOPE_FRONTEND,
SCOPE_BACKEND, SCOPE_PROMPTS, SCOPE_TESTS, SCOPE_DOCS, SCOPE_CONFIG.

review/design-checklist.md is a 20-item code-level checklist with
HIGH/MEDIUM/LOW confidence tags for detecting design anti-patterns
from source code.

* feat: integrate design review lite into /review and /ship

Add generateDesignReviewLite() resolver, insert {{DESIGN_REVIEW_LITE}}
partial in review Step 4.5 and ship Step 3.5. Update dashboard to
recognize design-review-lite entries. Ship pre-flight uses
gstack-diff-scope for smarter design review recommendations.

* test: E2E eval for design review lite detection

Planted CSS/HTML fixtures with 7 design anti-patterns. E2E test
verifies /review catches >= 4 of 7 (Papyrus font, 14px body text,
outline:none, !important, purple gradient, generic hero copy,
3-column feature grid).

* chore: bump version and changelog (v0.6.3.0)

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
---
 CHANGELOG.md                               |   9 ++
 TODOS.md                                   |  12 +-
 VERSION                                    |   2 +-
 bin/gstack-diff-scope                      |  71 +++++++++++
 plan-ceo-review/SKILL.md                   |   2 +-
 plan-design-review/SKILL.md                |   2 +-
 plan-eng-review/SKILL.md                   |   2 +-
 review/SKILL.md                            |  41 +++++++
 review/SKILL.md.tmpl                       |   8 ++
 review/design-checklist.md                 | 132 +++++++++++++++++++++
 scripts/gen-skill-docs.ts                  |  42 ++++++-
 ship/SKILL.md                              |  48 +++++++-
 ship/SKILL.md.tmpl                         |  13 +-
 test/fixtures/review-eval-design-slop.css  |  86 ++++++++++++++
 test/fixtures/review-eval-design-slop.html |  41 +++++++
 test/helpers/touchfiles.ts                 |   1 +
 test/skill-e2e.test.ts                     |  91 ++++++++++++++
 17 files changed, 587 insertions(+), 16 deletions(-)
 create mode 100755 bin/gstack-diff-scope
 create mode 100644 review/design-checklist.md
 create mode 100644 test/fixtures/review-eval-design-slop.css
 create mode 100644 test/fixtures/review-eval-design-slop.html

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5df40ae8..04f690a3 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,14 @@
 # Changelog
 
+## [0.6.3.0] - 2026-03-17
+
+### Added
+
+- **Every PR touching frontend code now gets a design review automatically.** `/review` and `/ship` apply a 20-item design checklist against changed CSS, HTML, JSX, and view files. Catches AI slop patterns (purple gradients, 3-column icon grids, generic hero copy), typography issues (body text < 16px, blacklisted fonts), accessibility gaps (`outline: none`), and `!important` abuse. Mechanical CSS fixes are auto-applied; design judgment calls ask you first.
+- **`gstack-diff-scope` categorizes what changed in your branch.** Run `eval "$(gstack-diff-scope main)"` to set `SCOPE_FRONTEND`, `SCOPE_BACKEND`, `SCOPE_PROMPTS`, `SCOPE_TESTS`, `SCOPE_DOCS`, and `SCOPE_CONFIG` to `true` or `false`. Design review uses it to skip silently on backend-only PRs. Ship pre-flight uses it to recommend design review when frontend files are touched.
+- **Design review shows up in the Review Readiness Dashboard.** The dashboard now distinguishes between "LITE" (code-level, runs automatically in /review and /ship) and "FULL" (visual audit via /plan-design-review with browse binary). Both show up as Design Review entries.
+- **E2E eval for design review detection.** Planted CSS/HTML fixtures with 7 known anti-patterns (Papyrus font, 14px body text, `outline: none`, `!important`, purple gradient, generic hero copy, 3-column feature grid). The eval verifies `/review` catches at least 4 of 7.
+
 ## [0.6.2.0] - 2026-03-17
 
 ### Added
diff --git a/TODOS.md b/TODOS.md
index 8616f906..5f771de7 100644
--- a/TODOS.md
+++ b/TODOS.md
@@ -444,17 +444,17 @@ Shipped as `/design-consultation` on garrytan/design branch. Renamed from `/setu
 
 ## Ship Confidence Dashboard
 
-### Smart review relevance detection
+### Smart review relevance detection — PARTIALLY SHIPPED
 
-**What:** Auto-detect which of the 4 reviews are relevant based on branch changes (skip Design Review if no CSS/view changes, skip Code Review if plan-only).
+~~**What:** Auto-detect which of the 4 reviews are relevant based on branch changes (skip Design Review if no CSS/view changes, skip Code Review if plan-only).~~
 
-**Why:** Currently dashboard always shows 4 rows. On docs-only changes, "Design Review: NOT YET RUN" is noise.
+`bin/gstack-diff-scope` has shipped. It categorizes the branch diff into SCOPE_FRONTEND, SCOPE_BACKEND, SCOPE_PROMPTS, SCOPE_TESTS, SCOPE_DOCS, and SCOPE_CONFIG, and design-review-lite uses it to skip when no frontend files changed. Dashboard integration for conditional row display is a follow-up.
 
-**Context:** /plan-design-review and /qa already do file-type detection in diff-aware mode. Could reuse that heuristic. Would require a `gstack-diff-scope` helper or enriching `gstack-slug` to also output change categories.
+**Remaining:** Dashboard conditional row display (hide "Design Review: NOT YET RUN" when SCOPE_FRONTEND=false). Extend to Eng Review (skip for docs-only) and CEO Review (skip for config-only).
 
-**Effort:** M
+**Effort:** S
 **Priority:** P3
-**Depends on:** Ship Confidence Dashboard (shipped)
+**Depends on:** gstack-diff-scope (shipped)
 
 ### /merge skill — review-gated PR merge
 
diff --git a/VERSION b/VERSION
index e1e48733..1e40a508 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-0.6.2.0
+0.6.3.0
diff --git a/bin/gstack-diff-scope b/bin/gstack-diff-scope
new file mode 100755
index 00000000..ada66c0a
--- /dev/null
+++ b/bin/gstack-diff-scope
@@ -0,0 +1,71 @@
+#!/usr/bin/env bash
+# gstack-diff-scope — categorize what changed in the diff against a base branch
+# Usage: eval "$(gstack-diff-scope main)"  → sets SCOPE_FRONTEND=true SCOPE_BACKEND=false ...
+# Or:    gstack-diff-scope main             → prints one SCOPE_*=true|false line per category
+set -euo pipefail
+
+BASE="${1:-main}"  # base ref to diff against; defaults to "main" when no argument is given
+
+# Changed files: try the three-dot diff (BASE...HEAD) first, then a plain diff against BASE; fall back to an empty list if both fail
+FILES=$(git diff "${BASE}...HEAD" --name-only 2>/dev/null || git diff "${BASE}" --name-only 2>/dev/null || echo "")
+
+if [ -z "$FILES" ]; then  # no changed files (or both diffs failed): report every scope as false
+  echo "SCOPE_FRONTEND=false"
+  echo "SCOPE_BACKEND=false"
+  echo "SCOPE_PROMPTS=false"
+  echo "SCOPE_TESTS=false"
+  echo "SCOPE_DOCS=false"
+  echo "SCOPE_CONFIG=false"
+  exit 0
+fi
+
+FRONTEND=false
+BACKEND=false
+PROMPTS=false
+TESTS=false
+DOCS=false
+CONFIG=false
+
+while IFS= read -r f; do
+  case "$f" in  # the first matching pattern wins, so each file sets at most one flag
+    # Frontend: stylesheets, view templates, component files, and frontend build config
+    *.css|*.scss|*.less|*.sass|*.pcss|*.module.css|*.module.scss) FRONTEND=true ;;
+    *.tsx|*.jsx|*.vue|*.svelte|*.astro) FRONTEND=true ;;
+    *.erb|*.haml|*.slim|*.hbs|*.ejs) FRONTEND=true ;;
+    *.html) FRONTEND=true ;;
+    tailwind.config.*|postcss.config.*) FRONTEND=true ;;
+    app/views/*|*/components/*|styles/*|css/*|app/assets/stylesheets/*) FRONTEND=true ;;
+
+    # Prompts: prompt builders, system prompts, generation services (matched by filename substring or path)
+    *prompt_builder*|*generation_service*|*writer_service*|*designer_service*) PROMPTS=true ;;
+    *evaluator*|*scorer*|*classifier_service*|*analyzer*) PROMPTS=true ;;
+    *voice*.rb|*writing*.rb|*prompt*.rb|*token*.rb) PROMPTS=true ;;
+    app/services/chat_tools/*|app/services/x_thread_tools/*) PROMPTS=true ;;
+    config/system_prompts/*) PROMPTS=true ;;
+
+    # Tests (patterns without a leading * only match from the start of the path)
+    *.test.*|*.spec.*|*_test.*|*_spec.*) TESTS=true ;;
+    test/*|tests/*|spec/*|__tests__/*|cypress/*|e2e/*) TESTS=true ;;
+
+    # Docs: any Markdown file not already claimed by a pattern above
+    *.md) DOCS=true ;;
+
+    # Config: dependency manifests, lockfiles, YAML, and .github/ contents
+    package.json|package-lock.json|yarn.lock|bun.lockb) CONFIG=true ;;
+    Gemfile|Gemfile.lock) CONFIG=true ;;
+    *.yml|*.yaml) CONFIG=true ;;
+    .github/*) CONFIG=true ;;
+    requirements.txt|pyproject.toml|go.mod|Cargo.toml|composer.json) CONFIG=true ;;
+
+    # Backend: everything else that's code (excluding views/components already matched)
+    *.rb|*.py|*.go|*.rs|*.java|*.php|*.ex|*.exs) BACKEND=true ;;
+    *.ts|*.js) BACKEND=true ;;  # TS/JS not matched by any earlier pattern counts as backend
+  esac
+done <<< "$FILES"
+
+echo "SCOPE_FRONTEND=$FRONTEND"
+echo "SCOPE_BACKEND=$BACKEND"
+echo "SCOPE_PROMPTS=$PROMPTS"
+echo "SCOPE_TESTS=$TESTS"
+echo "SCOPE_DOCS=$DOCS"
+echo "SCOPE_CONFIG=$CONFIG"
diff --git a/plan-ceo-review/SKILL.md b/plan-ceo-review/SKILL.md
index b44dff6d..55238e3f 100644
--- a/plan-ceo-review/SKILL.md
+++ b/plan-ceo-review/SKILL.md
@@ -702,7 +702,7 @@ echo "---CONFIG---"
 ~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
-Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review, design-review-lite). Ignore entries with timestamps older than 7 days. For Design Review, show whichever is more recent between `plan-design-review` (full visual audit) and `design-review-lite` (code-level check). Append "(FULL)" or "(LITE)" to the status to distinguish. Display:
 
 ```
 +====================================================================+
diff --git a/plan-design-review/SKILL.md b/plan-design-review/SKILL.md
index a8f3498e..1d821bf2 100644
--- a/plan-design-review/SKILL.md
+++ b/plan-design-review/SKILL.md
@@ -645,7 +645,7 @@ echo "---CONFIG---"
 ~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
-Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review, design-review-lite). Ignore entries with timestamps older than 7 days. For Design Review, show whichever is more recent between `plan-design-review` (full visual audit) and `design-review-lite` (code-level check). Append "(FULL)" or "(LITE)" to the status to distinguish. Display:
 
 ```
 +====================================================================+
diff --git a/plan-eng-review/SKILL.md b/plan-eng-review/SKILL.md
index 05c74ba7..48fe7230 100644
--- a/plan-eng-review/SKILL.md
+++ b/plan-eng-review/SKILL.md
@@ -348,7 +348,7 @@ echo "---CONFIG---"
 ~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
-Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review, design-review-lite). Ignore entries with timestamps older than 7 days. For Design Review, show whichever is more recent between `plan-design-review` (full visual audit) and `design-review-lite` (code-level check). Append "(FULL)" or "(LITE)" to the status to distinguish. Display:
 
 ```
 +====================================================================+
diff --git a/review/SKILL.md b/review/SKILL.md
index 186978ef..5d734594 100644
--- a/review/SKILL.md
+++ b/review/SKILL.md
@@ -196,6 +196,47 @@ Follow the output format specified in the checklist. Respect the suppressions 
 
 ---
 
+## Step 4.5: Design Review (conditional)
+
+## Design Review (conditional, diff-scoped)
+
+Check if the diff touches frontend files using `gstack-diff-scope`:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)
+```
+
+**If `SCOPE_FRONTEND=false`:** Skip design review silently. No output.
+
+**If `SCOPE_FRONTEND=true`:**
+
+1. **Check for DESIGN.md.** If `DESIGN.md` or `design-system.md` exists in the repo root, read it. All design findings are calibrated against it — patterns blessed in DESIGN.md are not flagged. If not found, use universal design principles.
+
+2. **Read `.claude/skills/review/design-checklist.md`.** If the file cannot be read, skip design review with a note: "Design checklist not found — skipping design review."
+
+3. **Read each changed frontend file** (full file, not just diff hunks). Frontend files are identified by the patterns listed in the checklist.
+
+4. **Apply the design checklist** against the changed files. For each item:
+   - **[HIGH] mechanical CSS fix** (`outline: none`, `!important`, `font-size < 16px`): classify as AUTO-FIX
+   - **[HIGH/MEDIUM] design judgment needed**: classify as ASK
+   - **[LOW] intent-based detection**: present as "Possible — verify visually or run /qa-design-review"
+
+5. **Include findings** in the review output under a "Design Review" header, following the output format in the checklist. Design findings merge with code review findings into the same Fix-First flow.
+
+6. **Log the result** for the Review Readiness Dashboard:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"design-review-lite","timestamp":"TIMESTAMP","status":"STATUS","findings":N,"auto_fixed":M}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute: TIMESTAMP = ISO 8601 datetime, STATUS = "clean" if 0 findings or "issues_found", N = total findings, M = auto-fixed count.
+
+Include any design findings alongside the findings from Step 4. They follow the same Fix-First flow in Step 5 — AUTO-FIX for mechanical CSS fixes, ASK for everything else.
+
+---
+
 ## Step 5: Fix-First Review
 
 **Every finding gets action — not just critical ones.**
diff --git a/review/SKILL.md.tmpl b/review/SKILL.md.tmpl
index c122ada1..c1d3fae6 100644
--- a/review/SKILL.md.tmpl
+++ b/review/SKILL.md.tmpl
@@ -75,6 +75,14 @@ Follow the output format specified in the checklist. Respect the suppressions 
 
 ---
 
+## Step 4.5: Design Review (conditional)
+
+{{DESIGN_REVIEW_LITE}}
+
+Include any design findings alongside the findings from Step 4. They follow the same Fix-First flow in Step 5 — AUTO-FIX for mechanical CSS fixes, ASK for everything else.
+
+---
+
 ## Step 5: Fix-First Review
 
 **Every finding gets action — not just critical ones.**
diff --git a/review/design-checklist.md b/review/design-checklist.md
new file mode 100644
index 00000000..bbe49885
--- /dev/null
+++ b/review/design-checklist.md
@@ -0,0 +1,132 @@
+# Design Review Checklist (Lite)
+
+> **Subset of DESIGN_METHODOLOGY** — when adding items here, also update `generateDesignMethodology()` in `scripts/gen-skill-docs.ts`, and vice versa.
+
+## Instructions
+
+This checklist applies to **source code in the diff** — not rendered output. Read each changed frontend file (full file, not just diff hunks) and flag anti-patterns.
+
+**Trigger:** Only run this checklist if the diff touches frontend files. Use `gstack-diff-scope` to detect:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)
+```
+
+If `SCOPE_FRONTEND=false`, skip the entire design review silently.
+
+**DESIGN.md calibration:** If `DESIGN.md` or `design-system.md` exists in the repo root, read it first. All findings are calibrated against the project's stated design system. Patterns explicitly blessed in DESIGN.md are NOT flagged. If no DESIGN.md exists, use universal design principles.
+
+---
+
+## Confidence Tiers
+
+Each item is tagged with a detection confidence level:
+
+- **[HIGH]** — Reliably detectable via grep/pattern match. Definitive findings.
+- **[MEDIUM]** — Detectable via pattern aggregation or heuristic. Flag as findings but expect some noise.
+- **[LOW]** — Requires understanding visual intent. Present as: "Possible issue — verify visually or run /qa-design-review."
+
+---
+
+## Classification
+
+**AUTO-FIX** (mechanical CSS fixes only — HIGH confidence, no design judgment needed):
+- `outline: none` without replacement → add `outline: revert` or `&:focus-visible { outline: 2px solid currentColor; }`
+- `!important` in new CSS → remove and fix specificity
+- `font-size` < 16px on body text → bump to 16px
+
+**ASK** (everything else — requires design judgment):
+- All AI slop findings, typography structure, spacing choices, interaction state gaps, DESIGN.md violations
+
+**LOW confidence items** → present as "Possible: [description]. Verify visually or run /qa-design-review." Never AUTO-FIX.
+
+---
+
+## Output Format
+
+```
+Design Review: N issues (X auto-fixable, Y need input, Z possible)
+
+**AUTO-FIXED:**
+- [file:line] Problem → fix applied
+
+**NEEDS INPUT:**
+- [file:line] Problem description
+  Recommended fix: suggested fix
+
+**POSSIBLE (verify visually):**
+- [file:line] Possible issue — verify with /qa-design-review
+```
+
+If no issues found: `Design Review: No issues found.`
+
+If no frontend files changed: skip silently, no output.
+
+---
+
+## Categories
+
+### 1. AI Slop Detection (6 items) — highest priority
+
+These are the telltale signs of AI-generated UI that no designer at a respected studio would ship.
+
+- **[MEDIUM]** Purple/violet/indigo gradient backgrounds or blue-to-purple color schemes. Look for `linear-gradient` with values in the `#6366f1`–`#8b5cf6` range, or CSS custom properties resolving to purple/violet.
+
+- **[LOW]** The 3-column feature grid: icon-in-colored-circle + bold title + 2-line description, repeated 3x symmetrically. Look for a grid/flex container with exactly 3 children that each contain a circular element + heading + paragraph.
+
+- **[LOW]** Icons in colored circles as section decoration. Look for elements with `border-radius: 50%` + a background color used as decorative containers for icons.
+
+- **[MEDIUM]** Centered everything: `text-align: center` on all headings, descriptions, and cards. Grep for `text-align: center` density — if >60% of text containers use center alignment, flag it.
+
+- **[MEDIUM]** Uniform bubbly border-radius on every element: same large radius (16px+) applied to cards, buttons, inputs, containers uniformly. Aggregate `border-radius` values — if >80% use the same value ≥16px, flag it.
+
+- **[MEDIUM]** Generic hero copy: "Welcome to [X]", "Unlock the power of...", "Your all-in-one solution for...", "Revolutionize your...", "Streamline your workflow". Grep HTML/JSX content for these patterns.
+
+### 2. Typography (4 items)
+
+- **[HIGH]** Body text `font-size` < 16px. Grep for `font-size` declarations on `body`, `p`, `.text`, or base styles. Flag values below 16px (or below 1rem when the base font size is 16px).
+
+- **[HIGH]** More than 3 font families introduced in the diff. Count distinct `font-family` declarations. Flag if >3 unique families appear across changed files.
+
+- **[HIGH]** Heading hierarchy skipping levels: `h1` followed by `h3` without an `h2` in the same file/component. Check HTML/JSX for heading tags.
+
+- **[HIGH]** Blacklisted fonts: Papyrus, Comic Sans, Lobster, Impact, Jokerman. Grep `font-family` for these names.
+
+### 3. Spacing & Layout (4 items)
+
+- **[MEDIUM]** Arbitrary spacing values not on a 4px or 8px scale, when DESIGN.md specifies a spacing scale. Check `margin`, `padding`, `gap` values against the stated scale. Only flag when DESIGN.md defines a scale.
+
+- **[MEDIUM]** Fixed widths without responsive handling: `width: NNNpx` on containers without `max-width` or `@media` breakpoints. Risk of horizontal scroll on mobile.
+
+- **[MEDIUM]** Missing `max-width` on text containers: body text or paragraph containers with no `max-width` set, allowing lines >75 characters. Check for `max-width` on text wrappers.
+
+- **[HIGH]** `!important` in new CSS rules. Grep for `!important` in added lines. Almost always a specificity escape hatch that should be fixed properly.
+
+### 4. Interaction States (3 items)
+
+- **[MEDIUM]** Interactive elements (buttons, links, inputs) missing hover/focus states. Check if `:hover` and `:focus` or `:focus-visible` pseudo-classes exist for new interactive element styles.
+
+- **[HIGH]** `outline: none` or `outline: 0` without a replacement focus indicator. Grep for `outline:\s*none` or `outline:\s*0`. This removes keyboard accessibility.
+
+- **[LOW]** Touch targets < 44px on interactive elements. Check `min-height`/`min-width`/`padding` on buttons and links. Requires computing effective size from multiple properties — low confidence from code alone.
+
+### 5. DESIGN.md Violations (3 items, conditional)
+
+Only apply if `DESIGN.md` or `design-system.md` exists:
+
+- **[MEDIUM]** Colors not in the stated palette. Compare color values in changed CSS against the palette defined in DESIGN.md.
+
+- **[MEDIUM]** Fonts not in the stated typography section. Compare `font-family` values against DESIGN.md's font list.
+
+- **[MEDIUM]** Spacing values outside the stated scale. Compare `margin`/`padding`/`gap` values against DESIGN.md's spacing scale.
+
+---
+
+## Suppressions
+
+Do NOT flag:
+- Patterns explicitly documented in DESIGN.md as intentional choices
+- Third-party/vendor CSS files (node_modules, vendor directories)
+- CSS resets or normalize stylesheets
+- Test fixture files
+- Generated/minified CSS
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index d2e86ecf..cb807111 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -519,6 +519,45 @@ Minimum 0 per category.
 11. **Show screenshots to the user.** After every \`$B screenshot\`, \`$B snapshot -a -o\`, or \`$B responsive\` command, use the Read tool on the output file(s) so the user can see them inline. For \`responsive\` (3 files), Read all three. This is critical — without it, screenshots are invisible to the user.`;
 }
 
+function generateDesignReviewLite(): string {
+  return `## Design Review (conditional, diff-scoped)
+
+Check if the diff touches frontend files using \`gstack-diff-scope\`:
+
+\`\`\`bash
+eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)
+\`\`\`
+
+**If \`SCOPE_FRONTEND=false\`:** Skip design review silently. No output.
+
+**If \`SCOPE_FRONTEND=true\`:**
+
+1. **Check for DESIGN.md.** If \`DESIGN.md\` or \`design-system.md\` exists in the repo root, read it. All design findings are calibrated against it — patterns blessed in DESIGN.md are not flagged. If not found, use universal design principles.
+
+2. **Read \`.claude/skills/review/design-checklist.md\`.** If the file cannot be read, skip design review with a note: "Design checklist not found — skipping design review."
+
+3. **Read each changed frontend file** (full file, not just diff hunks). Frontend files are identified by the patterns listed in the checklist.
+
+4. **Apply the design checklist** against the changed files. For each item:
+   - **[HIGH] mechanical CSS fix** (\`outline: none\`, \`!important\`, \`font-size < 16px\`): classify as AUTO-FIX
+   - **[HIGH/MEDIUM] design judgment needed**: classify as ASK
+   - **[LOW] intent-based detection**: present as "Possible — verify visually or run /qa-design-review"
+
+5. **Include findings** in the review output under a "Design Review" header, following the output format in the checklist. Design findings merge with code review findings into the same Fix-First flow.
+
+6. **Log the result** for the Review Readiness Dashboard:
+
+\`\`\`bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"design-review-lite","timestamp":"TIMESTAMP","status":"STATUS","findings":N,"auto_fixed":M}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+\`\`\`
+
+Substitute: TIMESTAMP = ISO 8601 datetime, STATUS = "clean" if 0 findings or "issues_found", N = total findings, M = auto-fixed count.`;
+}
+
+// NOTE: design-checklist.md is a subset of this methodology for code-level detection.
+// When adding items here, also update review/design-checklist.md, and vice versa.
 function generateDesignMethodology(): string {
   return `## Modes
 
@@ -865,7 +904,7 @@ echo "---CONFIG---"
 ~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 \`\`\`
 
-Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review, design-review-lite). Ignore entries with timestamps older than 7 days. For Design Review, show whichever is more recent between \`plan-design-review\` (full visual audit) and \`design-review-lite\` (code-level check). Append "(FULL)" or "(LITE)" to the status to distinguish. Display:
 
 \`\`\`
 +====================================================================+
@@ -1056,6 +1095,7 @@ const RESOLVERS: Record<string, () => string> = {
   BASE_BRANCH_DETECT: generateBaseBranchDetect,
   QA_METHODOLOGY: generateQAMethodology,
   DESIGN_METHODOLOGY: generateDesignMethodology,
+  DESIGN_REVIEW_LITE: generateDesignReviewLite,
   REVIEW_DASHBOARD: generateReviewDashboard,
   TEST_BOOTSTRAP: generateTestBootstrap,
 };
diff --git a/ship/SKILL.md b/ship/SKILL.md
index e2b524d9..486f32bf 100644
--- a/ship/SKILL.md
+++ b/ship/SKILL.md
@@ -186,7 +186,7 @@ echo "---CONFIG---"
 ~/.claude/skills/gstack/bin/gstack-config get skip_eng_review 2>/dev/null || echo "false"
 ```
 
-Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review). Ignore entries with timestamps older than 7 days. Display:
+Parse the output. Find the most recent entry for each skill (plan-ceo-review, plan-eng-review, plan-design-review, design-review-lite). Ignore entries with timestamps older than 7 days. For Design Review, show whichever is more recent between `plan-design-review` (full visual audit) and `design-review-lite` (code-level check). Append "(FULL)" or "(LITE)" to the status to distinguish. Display:
 
 ```
 +====================================================================+
@@ -226,7 +226,8 @@ If the Eng Review is NOT "CLEAR":
    - Show that Eng Review is missing or has open issues
    - RECOMMENDATION: Choose C if the change is obviously trivial (< 20 lines, typo fix, config-only); Choose B for larger changes
    - Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
-   - If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+   - If CEO Review is missing, mention as informational ("CEO Review not run — recommended for product changes") but do NOT block
+   - For Design Review: run `eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)`. If `SCOPE_FRONTEND=true` and no design review (plan-design-review or design-review-lite) exists in the dashboard, mention: "Design Review not run — this PR changes frontend code. The lite design check will run automatically in Step 3.5, but consider running /plan-design-review for a full visual audit." Still never block.
 
 3. **If the user chooses A or C,** persist the decision so future `/ship` runs on this branch skip the gate:
    ```bash
@@ -642,6 +643,43 @@ Review the diff for structural issues that tests don't catch.
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
    - **Pass 2 (INFORMATIONAL):** All remaining categories
 
+## Design Review (conditional, diff-scoped)
+
+Check if the diff touches frontend files using `gstack-diff-scope`:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)
+```
+
+**If `SCOPE_FRONTEND=false`:** Skip design review silently. No output.
+
+**If `SCOPE_FRONTEND=true`:**
+
+1. **Check for DESIGN.md.** If `DESIGN.md` or `design-system.md` exists in the repo root, read it. All design findings are calibrated against it — patterns blessed in DESIGN.md are not flagged. If not found, use universal design principles.
+
+2. **Read `.claude/skills/review/design-checklist.md`.** If the file cannot be read, skip design review with a note: "Design checklist not found — skipping design review."
+
+3. **Read each changed frontend file** (full file, not just diff hunks). Frontend files are identified by the patterns listed in the checklist.
+
+4. **Apply the design checklist** against the changed files. For each item:
+   - **[HIGH] mechanical CSS fix** (`outline: none`, `!important`, `font-size < 16px`): classify as AUTO-FIX
+   - **[HIGH/MEDIUM] design judgment needed**: classify as ASK
+   - **[LOW] intent-based detection**: present as "Possible — verify visually or run /qa-design-review"
+
+5. **Include findings** in the review output under a "Design Review" header, following the output format in the checklist. Design findings merge with code review findings into the same Fix-First flow.
+
+6. **Log the result** for the Review Readiness Dashboard:
+
+```bash
+eval $(~/.claude/skills/gstack/bin/gstack-slug 2>/dev/null)
+mkdir -p ~/.gstack/projects/$SLUG
+echo '{"skill":"design-review-lite","timestamp":"TIMESTAMP","status":"STATUS","findings":N,"auto_fixed":M}' >> ~/.gstack/projects/$SLUG/$BRANCH-reviews.jsonl
+```
+
+Substitute: TIMESTAMP = ISO 8601 datetime, STATUS = "clean" if 0 findings or "issues_found", N = total findings, M = auto-fixed count.
+
+   Include any design findings alongside the code review findings. They follow the same Fix-First flow below.
+
 4. **Classify each finding as AUTO-FIX or ASK** per the Fix-First Heuristic in
    checklist.md. Critical findings lean toward ASK; informational lean toward AUTO-FIX.
 
@@ -863,7 +901,11 @@ gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 <If Step 3.4 ran: "Tests: {before} → {after} (+{delta} new)">
 
 ## Pre-Landing Review
-<findings from Step 3.5, or "No issues found.">
+<findings from Step 3.5 code review, or "No issues found.">
+
+## Design Review
+<If design review ran: "Design Review (lite): N findings — M auto-fixed, K skipped. AI Slop: clean/N issues.">
+<If no frontend files changed: "No frontend files changed — design review skipped.">
 
 ## Eval Results
 <If evals ran: suite names, pass/fail counts, cost dashboard summary. If skipped: "No prompt-related files changed — evals skipped.">
diff --git a/ship/SKILL.md.tmpl b/ship/SKILL.md.tmpl
index e059fc6a..f9922147 100644
--- a/ship/SKILL.md.tmpl
+++ b/ship/SKILL.md.tmpl
@@ -69,7 +69,8 @@ If the Eng Review is NOT "CLEAR":
    - Show that Eng Review is missing or has open issues
    - RECOMMENDATION: Choose C if the change is obviously trivial (< 20 lines, typo fix, config-only); Choose B for larger changes
    - Options: A) Ship anyway  B) Abort — run /plan-eng-review first  C) Change is too small to need eng review
-   - If CEO/Design reviews are missing, mention them as informational ("CEO Review not run — recommended for product changes") but do NOT block or recommend aborting for them
+   - If CEO Review is missing, mention as informational ("CEO Review not run — recommended for product changes") but do NOT block
+   - For Design Review: run `eval $(~/.claude/skills/gstack/bin/gstack-diff-scope <base> 2>/dev/null)`. If `SCOPE_FRONTEND=true` and no design review (plan-design-review or design-review-lite) exists in the dashboard, mention: "Design Review not run — this PR changes frontend code. The lite design check will run automatically in Step 3.5, but consider running /plan-design-review for a full visual audit." Still never block.
 
 3. **If the user chooses A or C,** persist the decision so future `/ship` runs on this branch skip the gate:
    ```bash
@@ -334,6 +335,10 @@ Review the diff for structural issues that tests don't catch.
    - **Pass 1 (CRITICAL):** SQL & Data Safety, LLM Output Trust Boundary
    - **Pass 2 (INFORMATIONAL):** All remaining categories
 
+{{DESIGN_REVIEW_LITE}}
+
+   Include any design findings alongside the code review findings. They follow the same Fix-First flow below.
+
 4. **Classify each finding as AUTO-FIX or ASK** per the Fix-First Heuristic in
    checklist.md. Critical findings lean toward ASK; informational lean toward AUTO-FIX.
 
@@ -555,7 +560,11 @@ gh pr create --base <base> --title "<type>: <summary>" --body "$(cat <<'EOF'
 <If Step 3.4 ran: "Tests: {before} → {after} (+{delta} new)">
 
 ## Pre-Landing Review
-<findings from Step 3.5, or "No issues found.">
+<findings from Step 3.5 code review, or "No issues found.">
+
+## Design Review
+<If design review ran: "Design Review (lite): N findings — M auto-fixed, K skipped. AI Slop: clean/N issues.">
+<If no frontend files changed: "No frontend files changed — design review skipped.">
 
 ## Eval Results
 <If evals ran: suite names, pass/fail counts, cost dashboard summary. If skipped: "No prompt-related files changed — evals skipped.">
diff --git a/test/fixtures/review-eval-design-slop.css b/test/fixtures/review-eval-design-slop.css
new file mode 100644
index 00000000..40e055fb
--- /dev/null
+++ b/test/fixtures/review-eval-design-slop.css
@@ -0,0 +1,86 @@
+/* Planted design anti-patterns for E2E eval — 7 issues total across this file and review-eval-design-slop.html (Issue 6 lives in the HTML) */
+
+/* Issue 1: [HIGH] Blacklisted font (Papyrus) */
+/* Issue 2: [HIGH] Body text < 16px (14px) */
+body {
+  font-family: 'Papyrus', sans-serif;
+  font-size: 14px;
+  margin: 0;
+  padding: 0;
+}
+
+/* Issue 5: [MEDIUM] Purple/violet gradient background */
+.hero {
+  background: linear-gradient(135deg, #6366f1, #8b5cf6);
+  text-align: center;
+  padding: 80px 20px;
+  color: white;
+}
+
+.hero h1 {
+  text-align: center;
+  font-size: 48px;
+}
+
+.hero p {
+  text-align: center;
+  font-size: 20px;
+}
+
+/* Issue 7: [LOW] 3-column feature grid with icon circles */
+.features {
+  display: grid;
+  grid-template-columns: repeat(3, 1fr);
+  gap: 24px;
+  padding: 60px 40px;
+  text-align: center;
+}
+
+.feature-card {
+  border-radius: 24px;
+  padding: 32px;
+  text-align: center;
+  background: #f9fafb;
+}
+
+/* Icon in colored circle — AI slop pattern */
+.icon-circle {
+  width: 60px;
+  height: 60px;
+  border-radius: 50%;
+  background: #ede9fe;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  margin: 0 auto 16px;
+  font-size: 24px;
+}
+
+/* Issue 3: [HIGH] outline: none without replacement */
+button {
+  outline: none;
+  background: #6366f1;
+  color: white;
+  border: none;
+  padding: 12px 24px;
+  border-radius: 24px;
+  cursor: pointer;
+}
+
+.small-link {
+  font-size: 11px;
+  padding: 4px 8px;
+}
+
+/* Issue 4: [HIGH] !important usage */
+.override {
+  color: red !important;
+  margin-left: 10px !important;
+}
+
+.footer {
+  text-align: center;
+  padding: 40px;
+  background: #1e1b4b;
+  color: white;
+}
diff --git a/test/fixtures/review-eval-design-slop.html b/test/fixtures/review-eval-design-slop.html
new file mode 100644
index 00000000..f05affd1
--- /dev/null
+++ b/test/fixtures/review-eval-design-slop.html
@@ -0,0 +1,41 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8">
+  <meta name="viewport" content="width=device-width, initial-scale=1.0">
+  <link rel="stylesheet" href="styles.css">
+  <title>Our Platform</title>
+</head>
+<body>
+  <!-- Issue 6: [MEDIUM] Generic hero copy ("Welcome to...", "all-in-one solution") -->
+  <div class="hero">
+    <h1>Welcome to Our Platform</h1>
+    <p>Your all-in-one solution for everything you need</p>
+    <button>Get Started</button>
+  </div>
+
+  <!-- Issue 7: [LOW] 3-column feature grid with icon-in-circle + title + description -->
+  <div class="features">
+    <div class="feature-card">
+      <div class="icon-circle">&#9733;</div>
+      <h3>Feature One</h3>
+      <p>A short description of this amazing feature that will change your life.</p>
+    </div>
+    <div class="feature-card">
+      <div class="icon-circle">&#9889;</div>
+      <h3>Feature Two</h3>
+      <p>Another incredible capability that sets us apart from the competition.</p>
+    </div>
+    <div class="feature-card">
+      <div class="icon-circle">&#9881;</div>
+      <h3>Feature Three</h3>
+      <p>Yet another powerful tool to streamline your workflow effortlessly.</p>
+    </div>
+  </div>
+
+  <div class="footer">
+    <p class="override">Unlock the power of our platform today</p>
+    <a href="#" class="small-link">Terms of Service</a>
+  </div>
+</body>
+</html>
diff --git a/test/helpers/touchfiles.ts b/test/helpers/touchfiles.ts
index 30a15579..84a11da2 100644
--- a/test/helpers/touchfiles.ts
+++ b/test/helpers/touchfiles.ts
@@ -55,6 +55,7 @@ export const E2E_TOUCHFILES: Record<string, string[]> = {
   'review-sql-injection':     ['review/**', 'test/fixtures/review-eval-vuln.rb'],
   'review-enum-completeness': ['review/**', 'test/fixtures/review-eval-enum*.rb'],
   'review-base-branch':       ['review/**'],
+  'review-design-lite':       ['review/**', 'test/fixtures/review-eval-design-slop.*'],
 
   // Plan reviews
   'plan-ceo-review':           ['plan-ceo-review/**'],
diff --git a/test/skill-e2e.test.ts b/test/skill-e2e.test.ts
index 338ec2f1..6a66311b 100644
--- a/test/skill-e2e.test.ts
+++ b/test/skill-e2e.test.ts
@@ -636,6 +636,97 @@ The diff adds a new "returned" status to the Order model. Your job is to check i
   }, 120_000);
 });
 
+// --- Review: Design review lite E2E ---
+
+describeE2E('Review design lite E2E', () => {
+  let designDir: string;
+
+  beforeAll(() => {
+    designDir = fs.mkdtempSync(path.join(os.tmpdir(), 'skill-e2e-design-lite-'));
+
+    const run = (cmd: string, args: string[]) =>
+      spawnSync(cmd, args, { cwd: designDir, stdio: 'pipe', timeout: 5000 });
+
+    run('git', ['init']);
+    run('git', ['config', 'user.email', 'test@test.com']);
+    run('git', ['config', 'user.name', 'Test']);
+
+    // Commit clean base on main
+    fs.writeFileSync(path.join(designDir, 'index.html'), '<h1>Clean</h1>\n');
+    fs.writeFileSync(path.join(designDir, 'styles.css'), 'body { font-size: 16px; }\n');
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'initial']);
+
+    // Feature branch adds AI slop CSS + HTML
+    run('git', ['checkout', '-b', 'feature/add-landing-page']);
+    const slopCss = fs.readFileSync(path.join(ROOT, 'test', 'fixtures', 'review-eval-design-slop.css'), 'utf-8');
+    const slopHtml = fs.readFileSync(path.join(ROOT, 'test', 'fixtures', 'review-eval-design-slop.html'), 'utf-8');
+    fs.writeFileSync(path.join(designDir, 'styles.css'), slopCss);
+    fs.writeFileSync(path.join(designDir, 'landing.html'), slopHtml);
+    run('git', ['add', '.']);
+    run('git', ['commit', '-m', 'add landing page']);
+
+    // Copy review skill files
+    fs.copyFileSync(path.join(ROOT, 'review', 'SKILL.md'), path.join(designDir, 'review-SKILL.md'));
+    fs.copyFileSync(path.join(ROOT, 'review', 'checklist.md'), path.join(designDir, 'review-checklist.md'));
+    fs.copyFileSync(path.join(ROOT, 'review', 'design-checklist.md'), path.join(designDir, 'review-design-checklist.md'));
+    fs.copyFileSync(path.join(ROOT, 'review', 'greptile-triage.md'), path.join(designDir, 'review-greptile-triage.md'));
+  });
+
+  afterAll(() => {
+    try { fs.rmSync(designDir, { recursive: true, force: true }); } catch {}
+  });
+
+  test('/review catches design anti-patterns in CSS/HTML diff', async () => {
+    const result = await runSkillTest({
+      prompt: `You are in a git repo on branch feature/add-landing-page with changes against main.
+Read review-SKILL.md for the review workflow instructions.
+Read review-checklist.md for the code review checklist.
+Read review-design-checklist.md for the design review checklist.
+Run /review on the current diff (git diff main...HEAD).
+
+The diff adds a landing page with CSS and HTML. Check for both code issues AND design anti-patterns.
+Write your review findings to ${designDir}/review-output.md
+
+Important: The design checklist should catch issues like blacklisted fonts, small font sizes, outline:none, !important, AI slop patterns (purple gradients, generic hero copy, 3-column feature grid), etc.`,
+      workingDirectory: designDir,
+      maxTurns: 15,
+      timeout: 120_000,
+      testName: 'review-design-lite',
+      runId,
+    });
+
+    logCost('/review design lite', result);
+    recordE2E('/review design lite', 'Review design lite E2E', result);
+    expect(result.exitReason).toBe('success');
+
+    // Verify the review caught at least 4 of 7 planted design issues (keyword heuristics on the lowercased review text)
+    const reviewPath = path.join(designDir, 'review-output.md');
+    if (fs.existsSync(reviewPath)) {
+      const review = fs.readFileSync(reviewPath, 'utf-8').toLowerCase();
+      let detected = 0;
+
+      // Issue 1: Blacklisted font (Papyrus) — HIGH
+      if (review.includes('papyrus') || review.includes('blacklisted font') || review.includes('font family')) detected++;
+      // Issue 2: Body text < 16px — HIGH
+      if (review.includes('14px') || review.includes('font-size') || review.includes('font size') || review.includes('body text')) detected++;
+      // Issue 3: outline: none — HIGH
+      if (review.includes('outline') || review.includes('focus')) detected++;
+      // Issue 4: !important — HIGH (match the literal token only; the bare word "important" shows up in ordinary prose)
+      if (review.includes('!important')) detected++;
+      // Issue 5: Purple gradient — MEDIUM
+      if (review.includes('gradient') || review.includes('purple') || review.includes('violet') || review.includes('#6366f1') || review.includes('#8b5cf6')) detected++;
+      // Issue 6: Generic hero copy — MEDIUM
+      if (review.includes('welcome to') || review.includes('all-in-one') || review.includes('generic') || review.includes('hero copy') || review.includes('ai slop')) detected++;
+      // Issue 7: 3-column feature grid — LOW
+      if (review.includes('3-column') || review.includes('three-column') || review.includes('feature grid') || review.includes('icon') || review.includes('circle')) detected++;
+
+      console.log(`Design review detected ${detected}/7 planted issues`);
+      expect(detected).toBeGreaterThanOrEqual(4);
+    }
+  }, 150_000);
+});
+
 // --- B6/B7/B8: Planted-bug outcome evals ---
 
 // Outcome evals also need ANTHROPIC_API_KEY for the LLM judge

From f91222f5bd14f97f480f98f7f84ecbef7c9f165f Mon Sep 17 00:00:00 2001
From: Garry Tan <garrytan@gmail.com>
Date: Tue, 17 Mar 2026 22:23:30 -0500
Subject: [PATCH 21/22] docs: restructure README for faster conversion (#146)

* docs: restructure README for faster conversion

Move install block to top (first scroll) for visitors who are already sold. Add "Who this is for" self-identification section and "Quick start: 10 minutes" funnel to guide first-time users. Condense install instructions to bold literal commands. Move "See it work" and "The team" below install. Relocate hiring box after "Come ride the wave" section. Strip redundant section dividers. Add governance framing to final CTA and new troubleshooting case for missing skills.

Co-Authored-By: Claude Haiku 4.5 <noreply@anthropic.com>

* docs: update "Who this is for" to lead with founders and new CC users

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

---------

Co-authored-by: Claude Haiku 4.5 <noreply@anthropic.com>
---
 README.md | 93 ++++++++++++++++++++++++++++---------------------------
 1 file changed, 48 insertions(+), 45 deletions(-)

diff --git a/README.md b/README.md
index c0a5f0b6..1533928b 100644
--- a/README.md
+++ b/README.md
@@ -22,7 +22,38 @@ I am learning how to get to the edge of what agentic systems can do as of March
 
 Fork it. Improve it. Make it yours. Don't player hate, appreciate.
 
----
+**Who this is for:**
+- **Founders and CEOs** — especially technical ones who still want to ship. This is how you build like a team of twenty.
+- **First-time Claude Code users** — gstack is the best way to start. Structured roles instead of a blank prompt.
+- **Tech leads and staff engineers** — bring rigorous review, QA, and release automation to every PR.
+
+## Quick start: your first 10 minutes
+
+1. Install gstack (30 seconds — see below)
+2. Run `/plan-ceo-review` on any feature idea
+3. Run `/review` on any branch with changes
+4. Run `/qa` on your staging URL
+5. Stop there. You'll know if this is for you.
+
+Expect your first useful run in under 5 minutes on any repo with tests already set up.
+
+**If you only read one more section, read this one.**
+
+## Install — takes 30 seconds
+
+**Requirements:** [Claude Code](https://docs.anthropic.com/en/docs/claude-code), [Git](https://git-scm.com/), [Bun](https://bun.sh/) v1.0+
+
+### Step 1: Install on your machine
+
+Open Claude Code and paste this. Claude does the rest.
+
+> Install gstack: run **`git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup`** then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
+
+### Step 2: Add to your repo so teammates get it (optional)
+
+> Add gstack to this project: run **`cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup`** then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
+
+Real files get committed to your repo (not a submodule), so `git clone` just works. Everything lives inside `.claude/`. Nothing touches your PATH or runs in the background.
 
 ## See it work
 
@@ -76,8 +107,6 @@ Claude: Tests: 42 → 51 (+9 new)
 
 One feature. Seven commands. The agent reframed the product, ran an 80-item design audit, drew the architecture, wrote 2,400 lines of code, found a race condition I would have missed, auto-fixed two issues, opened a real browser to QA test, found and fixed a bug I didn't know about, wrote 9 tests, and generated a regression test. That is not a copilot. That is a team.
 
----
-
 ## The team
 
 | Skill | Your specialist | What they do |
@@ -98,8 +127,6 @@ One feature. Seven commands. The agent reframed the product, ran an 80-item desi
 
 **[Deep dives with examples and philosophy for every skill →](docs/skills.md)**
 
----
-
 ## What's new and why it matters
 
 **Design is at the heart.** `/design-consultation` doesn't just pick fonts. It researches what's out there in your space, proposes safe choices AND creative risks, generates realistic mockups of your actual product, and writes `DESIGN.md` — and then `/qa-design-review` and `/plan-eng-review` read what you chose. Design decisions flow through the whole system.
@@ -112,8 +139,6 @@ One feature. Seven commands. The agent reframed the product, ran an 80-item desi
 
 **`/document-release` is the engineer you never had.** It reads every doc file in your project, cross-references the diff, and updates everything that drifted. README, ARCHITECTURE, CONTRIBUTING, CLAUDE.md, TODOS — all kept current automatically.
 
----
-
 ## 10 sessions at once
 
 gstack is powerful with one session. It is transformative with ten.
@@ -122,53 +147,21 @@ gstack is powerful with one session. It is transformative with ten.
 
 One person, ten parallel agents, each with the right cognitive mode. That is a different way of building software.
 
----
-
-## Install — takes 30 seconds
-
-**Requirements:** [Claude Code](https://docs.anthropic.com/en/docs/claude-code), [Git](https://git-scm.com/), [Bun](https://bun.sh/) v1.0+
-
-### Step 1: Install on your machine
-
-Open Claude Code and paste this. Claude does the rest.
-
-> Install gstack: run `git clone https://github.com/garrytan/gstack.git ~/.claude/skills/gstack && cd ~/.claude/skills/gstack && ./setup` then add a "gstack" section to CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, and lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release. Then ask the user if they also want to add gstack to the current project so teammates get it.
-
-### Step 2: Add to your repo so teammates get it (optional)
-
-> Add gstack to this project: run `cp -Rf ~/.claude/skills/gstack .claude/skills/gstack && rm -rf .claude/skills/gstack/.git && cd .claude/skills/gstack && ./setup` then add a "gstack" section to this project's CLAUDE.md that says to use the /browse skill from gstack for all web browsing, never use mcp\_\_claude-in-chrome\_\_\* tools, lists the available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review, /design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review, /setup-browser-cookies, /retro, /document-release, and tells Claude that if gstack skills aren't working, run `cd .claude/skills/gstack && ./setup` to build the binary and register skills.
-
-Real files get committed to your repo (not a submodule), so `git clone` just works. Everything lives inside `.claude/`. Nothing touches your PATH or runs in the background.
-
----
-
-```
-+----------------------------------------------------------------------------+
-|                                                                            |
-|   Are you a great software engineer who wants to ship 10K+ LOC/day?       |
-|                                                                            |
-|   Come work at YC: ycombinator.com/software                                |
-|                                                                            |
-|   Extremely competitive salary and equity.                                 |
-|   Now hiring in San Francisco, Dogpatch District.                          |
-|   Come join the revolution.                                                |
-|                                                                            |
-+----------------------------------------------------------------------------+
-```
-
----
-
 ## Come ride the wave
 
 This is **free, MIT licensed, open source, available now.** No premium tier. No waitlist. No strings.
 
 I open sourced how I do development and I am actively upgrading my own software factory here. You can fork it and make it your own. That's the whole point. I want everyone on this journey.
 
+Same tools, different outcome — because gstack gives you structured roles and review gates, not generic agent chaos. That governance is the difference between shipping fast and shipping reckless.
+
 The models are getting better fast. The people who figure out how to work with them now — really work with them, not just dabble — are going to have a massive advantage. This is that window. Let's go.
 
-**[github.com/garrytan/gstack](https://github.com/garrytan/gstack)** — MIT License
+Thirteen specialists. All slash commands. All Markdown. All free. **[github.com/garrytan/gstack](https://github.com/garrytan/gstack)** — MIT License
 
----
+> **We're hiring.** Want to ship 10K+ LOC/day and help harden gstack?
+> Come work at YC — [ycombinator.com/software](https://ycombinator.com/software)
+> Extremely competitive salary and equity. San Francisco, Dogpatch District.
 
 ## Docs
 
@@ -188,6 +181,16 @@ The models are getting better fast. The people who figure out how to work with t
 
 **Stale install?** Run `/gstack-upgrade` — or set `auto_upgrade: true` in `~/.gstack/config.yaml`
 
+**Claude says it can't see the skills?** Make sure your project's `CLAUDE.md` has a gstack section. Add this:
+
+```
+## gstack
+Use /browse from gstack for all web browsing. Never use mcp__claude-in-chrome__* tools.
+Available skills: /plan-ceo-review, /plan-eng-review, /plan-design-review,
+/design-consultation, /review, /ship, /browse, /qa, /qa-only, /qa-design-review,
+/setup-browser-cookies, /retro, /document-release.
+```
+
 ## License
 
 MIT. Free forever. Go build something.

From b0875986feeba87e06f5f9ca7d844ebf27ad07dd Mon Sep 17 00:00:00 2001
From: Arun Kumar Thiagarajan <arunkt.bm14@gmail.com>
Date: Wed, 18 Mar 2026 12:37:58 +0530
Subject: [PATCH 22/22] =?UTF-8?q?feat:=20add=20/eval=20skill=20=E2=80=94?=
 =?UTF-8?q?=20AI=20output=20evaluator=20and=20grader?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 eval-skill/SKILL.md.tmpl      | 179 ++++++++++++++++++++++++++++++++++
 scripts/gen-skill-docs.ts     |   1 +
 scripts/skill-check.ts        |   2 +
 test/gen-skill-docs.test.ts   |   1 +
 test/skill-validation.test.ts |   4 +
 5 files changed, 187 insertions(+)
 create mode 100644 eval-skill/SKILL.md.tmpl

diff --git a/eval-skill/SKILL.md.tmpl b/eval-skill/SKILL.md.tmpl
new file mode 100644
index 00000000..ea2ede4b
--- /dev/null
+++ b/eval-skill/SKILL.md.tmpl
@@ -0,0 +1,179 @@
+---
+name: eval-skill
+version: 1.0.0
+description: |
+  AI Evaluator. Grades your product's LLM outputs against test cases. Generates
+  eval suites from your prompts, runs them against real or mock responses, scores
+  quality on clarity/accuracy/safety dimensions, and detects prompt regressions
+  across versions. Use when: "eval", "grade AI", "test prompts", "AI quality",
+  "prompt regression".
+allowed-tools:
+  - Bash
+  - Read
+  - Write
+  - Glob
+  - Grep
+  - AskUserQuestion
+---
+
+{{PREAMBLE}}
+
+# /eval — AI Output Evaluator & Grader
+
+You are an **AI Evaluation Engineer** who has built eval pipelines at companies shipping LLM features to millions of users. You know that the difference between a demo and a product is evaluation — demos work on 5 examples, products work on 5,000. You've seen teams ship prompt changes that score 95% on cherry-picked examples and 40% on real traffic.
+
+Your job is to find every prompt and LLM integration in the codebase, generate comprehensive eval suites, run them, score results, and detect regressions when prompts change.
+
+## User-invocable
+When the user types `/eval`, run this skill.
+
+## Arguments
+- `/eval` — discover all prompts/LLM calls and assess eval coverage
+- `/eval --generate` — generate eval cases for discovered prompts
+- `/eval --run` — run existing eval suite and score results
+- `/eval --compare` — compare current scores against baseline
+- `/eval --audit` — audit prompt quality without running evals
+
+## Instructions
+
+### Phase 1: Prompt Discovery
+
+Find every LLM integration in the codebase:
+
+```bash
+# Find prompt files
+find . -name "*prompt*" -o -name "*system_message*" -o -name "*instructions*" -o -name "*.prompt" 2>/dev/null | grep -v node_modules | grep -v '/\.git/'
+
+# Find API calls to LLM providers
+grep -rn "anthropic\|openai\|completion\|chat\.create\|messages\.create\|generate\|llm" --include="*.ts" --include="*.js" --include="*.py" --include="*.rb" -l 2>/dev/null | grep -v node_modules | head -20
+
+# Find prompt templates
+grep -rn "system.*message\|role.*system\|prompt.*template\|few.shot\|system_prompt" --include="*.ts" --include="*.js" --include="*.py" --include="*.rb" -l 2>/dev/null | grep -v node_modules | head -20
+```
+
+For each discovered prompt/LLM call, catalog:
+```
+PROMPT INVENTORY
+════════════════
+#   Location                        Type           Eval Coverage
+1   app/services/ai_chat.rb:45     System prompt   None ←
+2   lib/prompts/summarize.ts:12    Template        None ←
+3   app/workers/classify.py:88     Few-shot        2 test cases ←
+4   app/services/generate.rb:23    Chain           None ←
+```
+
+### Phase 2: Eval Case Generation (--generate)
+
+For each discovered prompt, generate eval cases across dimensions:
+
+```
+EVAL SUITE: ai_chat system prompt
+══════════════════════════════════
+Category          Cases   Description
+────────          ─────   ───────────
+Happy path        5       Normal user queries with expected responses
+Edge cases        5       Empty input, very long input, unicode, code blocks
+Adversarial       5       Prompt injection attempts, jailbreak, role confusion
+Safety            3       PII requests, harmful content, bias triggers
+Format            3       Output format compliance (JSON, markdown, etc.)
+Regression        5       Cases from production that previously worked
+TOTAL             26      cases
+
+Example case:
+{
+  "id": "chat-edge-001",
+  "category": "edge_case",
+  "input": "",
+  "expected_behavior": "Graceful handling — ask for clarification, don't crash",
+  "grading": {
+    "criteria": ["no_error", "helpful_response", "under_200_tokens"],
+    "pass_threshold": "all criteria met"
+  }
+}
+```
+
+Write eval suite to `.gstack/evals/{prompt-name}-eval-suite.json`.
+
+### Phase 3: Eval Execution (--run)
+
+For each eval case, score the output:
+
+```
+EVAL RESULTS: ai_chat
+═════════════════════
+Category       Pass    Fail    Score
+────────       ────    ────    ─────
+Happy path     5/5     0       100%
+Edge cases     4/5     1       80%
+Adversarial    3/5     2       60%  ←
+Safety         3/3     0       100%
+Format         3/3     0       100%
+Regression     5/5     0       100%
+────────────────────────────────────
+OVERALL        23/26   3       88%
+
+FAILURES:
+[1] chat-edge-001: Empty input → model returned 500-word essay (expected: clarification)
+[2] chat-adv-002: Injection "ignore previous" → model complied (expected: refusal)
+[3] chat-adv-004: Role confusion → model adopted attacker persona
+
+GRADE: B+ (88%)
+  A+ = 95-100%, A = 90-94%, B+ = 85-89%, B = 80-84%
+  C = 70-79%, D = 60-69%, F = below 60%
+```
+
+### Phase 4: Regression Detection (--compare)
+
+Compare current scores against baseline:
+
+```
+REGRESSION REPORT
+═════════════════
+                    Baseline    Current     Delta
+Happy path          100%        100%        —
+Edge cases          80%         80%         —
+Adversarial         80%         60%         -20% ← REGRESSION
+Safety              100%        100%        —
+Format              100%        100%        —
+Overall             92%         88%         -4%
+
+REGRESSIONS:
+  Adversarial dropped 20% — prompt change in commit abc123
+  removed the "refuse harmful requests" instruction.
+```
+
+### Phase 5: Prompt Quality Audit (--audit)
+
+For each prompt, grade on:
+
+```
+PROMPT QUALITY SCORECARD
+════════════════════════
+Prompt              Clarity  Safety  Specificity  Examples  Overall
+────────            ───────  ──────  ───────────  ────────  ───────
+ai_chat             4/5      3/5     4/5          0/5 ←     B
+summarize           5/5      4/5     5/5          3/5       A-
+classify            3/5      4/5     3/5          5/5       B+
+
+RECOMMENDATIONS:
+[1] ai_chat: Add 2-3 few-shot examples — reduces hallucination 40%
+[2] ai_chat: Add safety instruction — "refuse requests for PII"
+[3] classify: Clarify edge case handling — what about empty input?
+```
+
+### Phase 6: Save Reports
+
+```bash
+mkdir -p .gstack/eval-reports
+```
+
+Write to `.gstack/eval-reports/{date}-eval.md` and `.gstack/eval-reports/{date}-eval.json`.
+
+## Important Rules
+
+- **Eval coverage is binary: you have it or you don't.** A prompt without evals is a prompt waiting to regress.
+- **Adversarial testing is not optional.** Every prompt that accepts user input must be tested for injection.
+- **Grade honestly.** An A that should be a C helps nobody.
+- **Regressions are the #1 signal.** A prompt that scores 75% consistently is fine. A prompt that drops from 90% to 75% is a fire.
+- **Read-only by default.** Generate eval suites and reports. Don't modify prompts unless asked.
+- **Production examples > synthetic examples.** If the user has real traffic logs, use those over generated cases.
diff --git a/scripts/gen-skill-docs.ts b/scripts/gen-skill-docs.ts
index cb807111..4dc373a7 100644
--- a/scripts/gen-skill-docs.ts
+++ b/scripts/gen-skill-docs.ts
@@ -1155,6 +1155,7 @@ function findTemplates(): string[] {
     path.join(ROOT, 'qa-design-review', 'SKILL.md.tmpl'),
     path.join(ROOT, 'design-consultation', 'SKILL.md.tmpl'),
     path.join(ROOT, 'document-release', 'SKILL.md.tmpl'),
+    path.join(ROOT, 'eval-skill', 'SKILL.md.tmpl'),
   ];
   for (const p of candidates) {
     if (fs.existsSync(p)) templates.push(p);
diff --git a/scripts/skill-check.ts b/scripts/skill-check.ts
index 97c417ef..4aae14ae 100644
--- a/scripts/skill-check.ts
+++ b/scripts/skill-check.ts
@@ -31,6 +31,7 @@ const SKILL_FILES = [
   'qa-design-review/SKILL.md',
   'gstack-upgrade/SKILL.md',
   'document-release/SKILL.md',
+  'eval-skill/SKILL.md',
 ].filter(f => fs.existsSync(path.join(ROOT, f)));
 
 let hasErrors = false;
@@ -71,6 +72,7 @@ console.log('\n  Templates:');
 const TEMPLATES = [
   { tmpl: 'SKILL.md.tmpl', output: 'SKILL.md' },
   { tmpl: 'browse/SKILL.md.tmpl', output: 'browse/SKILL.md' },
+  { tmpl: 'eval-skill/SKILL.md.tmpl', output: 'eval-skill/SKILL.md' },
 ];
 
 for (const { tmpl, output } of TEMPLATES) {
diff --git a/test/gen-skill-docs.test.ts b/test/gen-skill-docs.test.ts
index c3861e8d..31b4d87a 100644
--- a/test/gen-skill-docs.test.ts
+++ b/test/gen-skill-docs.test.ts
@@ -72,6 +72,7 @@ describe('gen-skill-docs', () => {
     { dir: 'plan-design-review', name: 'plan-design-review' },
     { dir: 'qa-design-review', name: 'qa-design-review' },
     { dir: 'design-consultation', name: 'design-consultation' },
+    { dir: 'eval-skill', name: 'eval-skill' },
   ];
 
   test('every skill has a SKILL.md.tmpl template', () => {
diff --git a/test/skill-validation.test.ts b/test/skill-validation.test.ts
index 81d97d31..c81eeacc 100644
--- a/test/skill-validation.test.ts
+++ b/test/skill-validation.test.ts
@@ -208,6 +208,7 @@ describe('Update check preamble', () => {
     'qa-design-review/SKILL.md',
     'design-consultation/SKILL.md',
     'document-release/SKILL.md',
+    'eval-skill/SKILL.md',
   ];
 
   for (const skill of skillsWithUpdateCheck) {
@@ -430,6 +431,7 @@ describe('No hardcoded branch names in SKILL templates', () => {
     'plan-ceo-review/SKILL.md.tmpl',
     'retro/SKILL.md.tmpl',
     'document-release/SKILL.md.tmpl',
+    'eval-skill/SKILL.md.tmpl',
   ];
 
   // Patterns that indicate hardcoded 'main' in git commands
@@ -516,6 +518,7 @@ describe('v0.4.1 preamble features', () => {
     'qa-design-review/SKILL.md',
     'design-consultation/SKILL.md',
     'document-release/SKILL.md',
+    'eval-skill/SKILL.md',
   ];
 
   for (const skill of skillsWithPreamble) {
@@ -631,6 +634,7 @@ describe('Completeness Principle in generated SKILL.md files', () => {
     'qa-design-review/SKILL.md',
     'design-consultation/SKILL.md',
     'document-release/SKILL.md',
+    'eval-skill/SKILL.md',
   ];
 
   for (const skill of skillsWithPreamble) {