From ebf6fba410ec466c7281c82ab8f7992d68fc2bf7 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Thu, 1 Jan 2026 20:45:24 +0200
Subject: [PATCH 01/14] fix(background-task): remove unused lastMessage field
 from progress type

---
 src/tools/background-task/manager.ts      |  8 --------
 src/tools/background-task/types.ts        |  1 -
 tests/tools/background-task-types.test.ts | 15 +++++++++++++++
 3 files changed, 15 insertions(+), 9 deletions(-)
 create mode 100644 tests/tools/background-task-types.test.ts
diff --git a/src/tools/background-task/manager.ts b/src/tools/background-task/manager.ts
index 1a05c41..4ebb987 100644
--- a/src/tools/background-task/manager.ts
+++ b/src/tools/background-task/manager.ts
@@ -197,14 +197,6 @@ export class BackgroundTaskManager {
       output += `\n### Error\n${task.error}\n`;
     }
 
-    if (task.progress?.lastMessage) {
-      const preview =
-        task.progress.lastMessage.length > 200
-          ? `${task.progress.lastMessage.slice(0, 200)}...`
-          : task.progress.lastMessage;
-      output += `\n### Last Message Preview\n${preview}\n`;
-    }
-
     return output;
   }
 
diff --git a/src/tools/background-task/types.ts b/src/tools/background-task/types.ts
index 9d6b385..757865d 100644
--- a/src/tools/background-task/types.ts
+++ b/src/tools/background-task/types.ts
@@ -15,7 +15,6 @@ export interface BackgroundTask {
     toolCalls: number;
     lastTool?: string;
     lastUpdate: Date;
-    lastMessage?: string;
   };
 }
 
diff --git a/tests/tools/background-task-types.test.ts b/tests/tools/background-task-types.test.ts
new file mode 100644
index 0000000..f5f8441
--- /dev/null
+++ b/tests/tools/background-task-types.test.ts
@@ -0,0 +1,15 @@
+import { describe, it, expect } from "bun:test";
+
+describe("background-task types", () => {
+  it("should not have lastMessage in progress type", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/types.ts", "utf-8");
+    expect(source).not.toContain("lastMessage");
+  });
+
+  it("should not reference lastMessage in manager", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+    expect(source).not.toContain("lastMessage");
+  });
+});

From ab57cd1c6268ebbb5ed852c9204276807e5bd0f3 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Thu, 1 Jan 2026 20:47:02 +0200
Subject: [PATCH 02/14] feat(project-initializer): update to use
 background_task fire-and-collect pattern

---
 src/agents/project-initializer.ts        | 112 ++++++++++++++++-------
 tests/agents/project-initializer.test.ts |  32 +++++++
 2 files changed, 112 insertions(+), 32 deletions(-)
 create mode 100644 tests/agents/project-initializer.test.ts

diff --git a/src/agents/project-initializer.ts b/src/agents/project-initializer.ts
index 328938f..9da543a 100644
--- a/src/agents/project-initializer.ts
+++ b/src/agents/project-initializer.ts
@@ -10,7 +10,7 @@ const PROMPT = `
 
   <critical-rule>
     MAXIMIZE PARALLELISM. Speed is critical.
-    - Spawn multiple agents simultaneously
+    - Fire ALL background tasks simultaneously
     - Run multiple tool calls in single message
     - Never wait for one thing when you can do many
   </critical-rule>
@@ -23,16 +23,33 @@ const PROMPT = `
     </outputs>
   </task>
 
-  <parallel-execution-strategy>
-    <phase name="1-discovery" parallel="true">
-      <description>Spawn ALL discovery tasks simultaneously</description>
-      <spawn-agents>
+  <background-tools>
+    <tool name="background_task">
+      Fire a subagent to run in background. Returns task_id immediately.
+      Parameters: description, prompt, agent (subagent type)
+      Example: background_task(description="Find entry points", prompt="Find all entry points", agent="codebase-locator")
+    </tool>
+    <tool name="background_output">
+      Get results from a background task. Use block=true to wait for completion.
+      Parameters: task_id, block (boolean), timeout (optional)
+      Example: background_output(task_id="abc123", block=true)
+    </tool>
+    <tool name="background_list">
+      List all background tasks and their status.
+      No parameters required.
+    </tool>
+  </background-tools>
+
+  <parallel-execution-strategy pattern="fire-and-collect">
+    <phase name="1-fire" description="Fire ALL tasks simultaneously">
+      <description>Launch ALL discovery agents + run tools in a SINGLE message</description>
+      <fire-agents>
         <agent name="codebase-locator">Find entry points, configs, main modules</agent>
         <agent name="codebase-locator">Find test files and test patterns</agent>
         <agent name="codebase-locator">Find linter, formatter, CI configs</agent>
         <agent name="codebase-analyzer">Analyze directory structure</agent>
         <agent name="pattern-finder">Find naming conventions across files</agent>
-      </spawn-agents>
+      </fire-agents>
       <parallel-tools>
         <tool>Glob for package.json, pyproject.toml, go.mod, Cargo.toml, etc.</tool>
         <tool>Glob for *.config.*, .eslintrc*, .prettierrc*, ruff.toml, etc.</tool>
@@ -41,13 +58,19 @@ const PROMPT = `
       </parallel-tools>
     </phase>
 
-    <phase name="2-deep-analysis" parallel="true">
-      <description>Analyze core modules in parallel</description>
-      <spawn-agents>
+    <phase name="2-collect" description="Collect all results">
+      <description>Use background_output(block=true) to collect each result</description>
+      <action>Collect results from all fired agents</action>
+      <action>Process tool results from phase 1</action>
+    </phase>
+
+    <phase name="3-deep-analysis" description="Fire deep analysis tasks">
+      <description>Based on discovery, fire more background tasks</description>
+      <fire-agents>
         <agent name="codebase-analyzer">Analyze core/domain logic</agent>
         <agent name="codebase-analyzer">Analyze API/entry points</agent>
         <agent name="codebase-analyzer">Analyze data layer</agent>
-      </spawn-agents>
+      </fire-agents>
       <parallel-tools>
         <tool>Read 5 core source files simultaneously</tool>
         <tool>Read 3 test files simultaneously</tool>
@@ -55,8 +78,9 @@ const PROMPT = `
       </parallel-tools>
     </phase>
 
-    <phase name="3-write" parallel="true">
-      <description>Write both files in parallel</description>
+    <phase name="4-collect-and-write" description="Collect and write output">
+      <description>Collect deep analysis results, then write both files</description>
+      <action>Collect all deep analysis results</action>
       <action>Write ARCHITECTURE.md</action>
       <action>Write CODE_STYLE.md</action>
     </phase>
@@ -66,23 +90,36 @@ const PROMPT = `
     <subagent name="codebase-locator" spawn="multiple">
       Fast file/pattern finder. Spawn multiple with different queries.
       Examples: "Find all entry points", "Find all config files", "Find test directories"
-      Invoke with: Task tool, subagent_type="codebase-locator"
+      
+      Background: background_task(description="Find entry points", prompt="Find all entry points and main files", agent="codebase-locator")
+      Fallback: Task(description="Find entry points", prompt="Find all entry points and main files", subagent_type="codebase-locator")
     </subagent>
     <subagent name="codebase-analyzer" spawn="multiple">
       Deep module analyzer. Spawn multiple for different areas.
       Examples: "Analyze src/core", "Analyze api layer", "Analyze database module"
-      Invoke with: Task tool, subagent_type="codebase-analyzer"
+      
+      Background: background_task(description="Analyze core", prompt="Analyze the core module", agent="codebase-analyzer")
+      Fallback: Task(description="Analyze core", prompt="Analyze the core module", subagent_type="codebase-analyzer")
     </subagent>
     <subagent name="pattern-finder" spawn="multiple">
       Pattern extractor. Spawn for different pattern types.
       Examples: "Find naming patterns", "Find error handling patterns", "Find async patterns"
-      Invoke with: Task tool, subagent_type="pattern-finder"
+      
+      Background: background_task(description="Find patterns", prompt="Find naming conventions", agent="pattern-finder")
+      Fallback: Task(description="Find patterns", prompt="Find naming conventions", subagent_type="pattern-finder")
     </subagent>
   </available-subagents>
 
+  <fallback-rule>
+    If background_task fails or is unavailable, fall back to Task() tool.
+    The Task tool provides synchronous subagent execution.
+    Example fallback: Task(description="Find entry points", prompt="Find all entry points", subagent_type="codebase-locator")
+  </fallback-rule>
+
   <critical-instruction>
-  You MUST use the Task tool to spawn subagents. Call multiple Task tools in a SINGLE message for parallelism.
-  Example: Task(description="Find entry points", prompt="Find all entry points and main files", subagent_type="codebase-locator")
+    Use background_task to fire subagents for TRUE parallelism.
+    Fire ALL background_task calls in a SINGLE message, then collect with background_output(block=true).
+    This is the fire-and-collect pattern - fire everything, then collect everything.
   </critical-instruction>
 
   <language-detection>
@@ -148,10 +185,10 @@ const PROMPT = `
 
   <rules>
     <category name="Speed">
-      <rule>ALWAYS spawn multiple agents in a SINGLE message</rule>
+      <rule>ALWAYS fire multiple background_task calls in a SINGLE message</rule>
       <rule>ALWAYS run multiple tool calls in a SINGLE message</rule>
       <rule>NEVER wait for one task when you can start others</rule>
-      <rule>Batch related queries into parallel agent spawns</rule>
+      <rule>Use fire-and-collect: fire all, then collect all</rule>
     </category>
 
     <category name="Analysis">
@@ -176,27 +213,38 @@ const PROMPT = `
     </category>
   </rules>
 
-  <execution-example>
-    <step description="Start with maximum parallelism">
-      In a SINGLE message, call Task tool multiple times AND run other tools:
-      - Task(description="Find entry points", prompt="Find all entry points and main files", subagent_type="codebase-locator")
-      - Task(description="Find configs", prompt="Find all config files (linters, formatters, build)", subagent_type="codebase-locator")
-      - Task(description="Find tests", prompt="Find test directories and test files", subagent_type="codebase-locator")
-      - Task(description="Analyze structure", prompt="Analyze the directory structure and organization", subagent_type="codebase-analyzer")
-      - Task(description="Find patterns", prompt="Find naming conventions used across the codebase", subagent_type="pattern-finder")
+  <execution-example pattern="fire-and-collect">
+    <step description="FIRE: Launch all discovery tasks simultaneously">
+      In a SINGLE message, fire ALL background_task calls AND run other tools:
+      - background_task(description="Find entry points", prompt="Find all entry points and main files", agent="codebase-locator") -> task_id_1
+      - background_task(description="Find configs", prompt="Find all config files (linters, formatters, build)", agent="codebase-locator") -> task_id_2
+      - background_task(description="Find tests", prompt="Find test directories and test files", agent="codebase-locator") -> task_id_3
+      - background_task(description="Analyze structure", prompt="Analyze the directory structure and organization", agent="codebase-analyzer") -> task_id_4
+      - background_task(description="Find patterns", prompt="Find naming conventions used across the codebase", agent="pattern-finder") -> task_id_5
       - Glob: package.json, pyproject.toml, go.mod, Cargo.toml, etc.
       - Glob: README*, ARCHITECTURE*, docs/*
     </step>
 
-    <step description="Parallel deep analysis">
-      Based on discovery, in a SINGLE message:
-      - Task for each major module: subagent_type="codebase-analyzer"
+    <step description="COLLECT: Gather all results">
+      In a SINGLE message, collect ALL results:
+      - background_output(task_id=task_id_1, block=true)
+      - background_output(task_id=task_id_2, block=true)
+      - background_output(task_id=task_id_3, block=true)
+      - background_output(task_id=task_id_4, block=true)
+      - background_output(task_id=task_id_5, block=true)
+    </step>
+
+    <step description="FIRE: Deep analysis based on discovery">
+      Based on discovery, in a SINGLE message fire more tasks:
+      - background_task for each major module: agent="codebase-analyzer"
       - Read multiple source files simultaneously
       - Read multiple test files simultaneously
     </step>
 
-    <step description="Parallel write">
-      Write ARCHITECTURE.md and CODE_STYLE.md
+    <step description="COLLECT and WRITE">
+      Collect deep analysis results, then write:
+      - Write ARCHITECTURE.md
+      - Write CODE_STYLE.md
     </step>
   </execution-example>
 </agent>
diff --git a/tests/agents/project-initializer.test.ts b/tests/agents/project-initializer.test.ts
new file mode 100644
index 0000000..f5cb790
--- /dev/null
+++ b/tests/agents/project-initializer.test.ts
@@ -0,0 +1,32 @@
+import { describe, it, expect } from "bun:test";
+
+describe("project-initializer agent", () => {
+  it("should use background_task instead of Task", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/project-initializer.ts", "utf-8");
+
+    expect(source).toContain("background_task");
+    expect(source).toContain("background_output");
+  });
+
+  it("should have fire-and-collect pattern documentation", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/project-initializer.ts", "utf-8");
+
+    expect(source).toContain("fire-and-collect");
+  });
+
+  it("should have fallback-rule section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/project-initializer.ts", "utf-8");
+
+    expect(source).toContain("<fallback-rule>");
+  });
+
+  it("should have background-tools section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/project-initializer.ts", "utf-8");
+
+    expect(source).toContain("<background-tools>");
+  });
+});

From 893adefee771071b7b2995debcbc156ef7bc8a68 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Thu, 1 Jan 2026 20:47:09 +0200
Subject: [PATCH 03/14] feat(planner): update to use background_task
 fire-and-collect pattern

---
 src/agents/planner.ts        | 66 ++++++++++++++++++++++++++++--------
 tests/agents/planner.test.ts | 40 ++++++++++++++++++++++
 2 files changed, 92 insertions(+), 14 deletions(-)
 create mode 100644 tests/agents/planner.test.ts

diff --git a/src/agents/planner.ts b/src/agents/planner.ts
index ff32fd6..de0a400 100644
--- a/src/agents/planner.ts
+++ b/src/agents/planner.ts
@@ -13,13 +13,24 @@ Every task is bite-sized (2-5 minutes), with exact paths and complete code.
 
 <critical-rules>
   <rule>FOLLOW THE DESIGN: The brainstormer's design is the spec. Do not explore alternatives.</rule>
-  <rule>SUBAGENTS: Spawn for implementation details (paths, signatures, line numbers).</rule>
-  <rule>TOOLS (grep, read, etc.): Do NOT use directly - use subagents instead.</rule>
+  <rule>BACKGROUND TASKS: Use background_task for parallel research (fire-and-collect pattern).</rule>
+  <rule>TOOLS (grep, read, etc.): Do NOT use directly - use background subagents instead.</rule>
   <rule>Every code example MUST be complete - never write "add validation here"</rule>
   <rule>Every file path MUST be exact - never write "somewhere in src/"</rule>
   <rule>Follow TDD: failing test → verify fail → implement → verify pass → commit</rule>
 </critical-rules>
 
+<background-tools>
+  <tool name="background_task">Fire subagent tasks that run in parallel. Returns task_id immediately.</tool>
+  <tool name="background_output">Collect results from background tasks. Use block=true to wait for completion.</tool>
+  <tool name="background_list">List all background tasks and their status.</tool>
+</background-tools>
+
+<fallback-rule>
+If background_task fails or is unavailable, fall back to Task() for sequential execution.
+Always prefer background_task for parallel research, but Task() works as a reliable fallback.
+</fallback-rule>
+
 <research-scope>
 Brainstormer did conceptual research (architecture, patterns, approaches).
 Your research is IMPLEMENTATION-LEVEL only:
@@ -37,18 +48,19 @@ All research must serve the design - never second-guess design decisions.
 </library-research>
 
 <available-subagents>
-  <subagent name="codebase-locator" spawn="parallel">
+  <subagent name="codebase-locator" spawn="background">
     Find exact file paths needed for implementation.
     Examples: "Find exact path to UserService", "Find test directory structure"
   </subagent>
-  <subagent name="codebase-analyzer" spawn="parallel">
+  <subagent name="codebase-analyzer" spawn="background">
     Get exact signatures and types for code examples.
     Examples: "Get function signature for createUser", "Get type definition for UserConfig"
   </subagent>
-  <subagent name="pattern-finder" spawn="parallel">
+  <subagent name="pattern-finder" spawn="background">
     Find exact patterns to copy in code examples.
     Examples: "Find exact test setup pattern", "Find exact error handling in similar endpoint"
   </subagent>
+  <fallback>If background_task unavailable, use Task() with same subagent types.</fallback>
 </available-subagents>
 
 <inputs>
@@ -64,15 +76,20 @@ All research must serve the design - never second-guess design decisions.
   <action>Note any constraints or decisions made by brainstormer</action>
 </phase>
 
-<phase name="implementation-research">
-  <action>Spawn subagents in PARALLEL to gather exact details:</action>
-  <spawn-example>
-    In a SINGLE message, spawn:
-    - codebase-locator: "Find exact path to [component from design]"
-    - codebase-locator: "Find test file naming convention"
-    - codebase-analyzer: "Get exact signature for [function mentioned in design]"
-    - pattern-finder: "Find exact test setup pattern for [type of test]"
-  </spawn-example>
+<phase name="implementation-research" pattern="fire-and-collect">
+  <action>Fire background tasks AND library research in parallel:</action>
+  <fire-phase description="Launch all research simultaneously">
+    In a SINGLE message, fire:
+    - background_task(agent="codebase-locator", prompt="Find exact path to [component]")
+    - background_task(agent="codebase-analyzer", prompt="Get signature for [function]")
+    - background_task(agent="pattern-finder", prompt="Find test setup pattern")
+    - context7_resolve-library-id + context7_query-docs for API docs
+    - btca_ask for library internals when needed
+  </fire-phase>
+  <collect-phase description="Wait for all results">
+    - background_output(task_id=..., block=true) for each background task
+    - Combine all results for planning phase
+  </collect-phase>
   <rule>Only research what's needed to implement the design</rule>
   <rule>Never research alternatives to design decisions</rule>
 </phase>
@@ -164,6 +181,27 @@ git commit -m "feat(scope): add specific feature"
 </template>
 </output-format>
 
+<execution-example pattern="fire-and-collect">
+<step name="fire">
+// In a SINGLE message, fire all research tasks:
+background_task(agent="codebase-locator", prompt="Find UserService path")  // returns task_id_1
+background_task(agent="codebase-analyzer", prompt="Get createUser signature")  // returns task_id_2
+background_task(agent="pattern-finder", prompt="Find test setup pattern")  // returns task_id_3
+context7_resolve-library-id(libraryName="express")  // runs in parallel
+btca_ask(tech="express", question="middleware chain order")  // runs in parallel
+</step>
+<step name="collect">
+// Wait for all background tasks to complete:
+background_output(task_id=task_id_1, block=true)  // blocks until complete
+background_output(task_id=task_id_2, block=true)
+background_output(task_id=task_id_3, block=true)
+// context7 and btca_ask results already available from fire step
+</step>
+<step name="plan">
+// Use all collected results to write the implementation plan
+</step>
+</execution-example>
+
 <principles>
   <principle name="zero-context">Engineer knows nothing about our codebase</principle>
   <principle name="complete-code">Every code block is copy-paste ready</principle>
diff --git a/tests/agents/planner.test.ts b/tests/agents/planner.test.ts
new file mode 100644
index 0000000..070df4d
--- /dev/null
+++ b/tests/agents/planner.test.ts
@@ -0,0 +1,40 @@
+import { describe, it, expect } from "bun:test";
+
+describe("planner agent", () => {
+  it("should use background_task instead of Task for research", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/planner.ts", "utf-8");
+
+    expect(source).toContain("background_task");
+    expect(source).toContain("background_output");
+  });
+
+  it("should have fire-and-collect pattern documentation", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/planner.ts", "utf-8");
+
+    expect(source).toContain("fire-and-collect");
+  });
+
+  it("should have fallback-rule section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/planner.ts", "utf-8");
+
+    expect(source).toContain("<fallback-rule>");
+  });
+
+  it("should have background-tools section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/planner.ts", "utf-8");
+
+    expect(source).toContain("<background-tools>");
+  });
+
+  it("should mention running library research in parallel with agents", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/planner.ts", "utf-8");
+
+    expect(source).toContain("context7");
+    expect(source).toContain("btca_ask");
+  });
+});

From 49be9de9d6923ab49f2c92b8a98031df1120af33 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Thu, 1 Jan 2026 20:47:23 +0200
Subject: [PATCH 04/14] feat(executor): update to use background_task
 fire-and-check pattern

---
 src/agents/executor.ts        | 141 ++++++++++++++++++++++------------
 tests/agents/executor.test.ts |  40 ++++++++++
 2 files changed, 130 insertions(+), 51 deletions(-)
 create mode 100644 tests/agents/executor.test.ts

diff --git a/src/agents/executor.ts b/src/agents/executor.ts
index 1e9a1cd..c5e0f97 100644
--- a/src/agents/executor.ts
+++ b/src/agents/executor.ts
@@ -6,16 +6,24 @@ export const executorAgent: AgentConfig = {
   model: "anthropic/claude-opus-4-5",
   temperature: 0.2,
   prompt: `<purpose>
-Execute plan tasks with maximum parallelism.
+Execute plan tasks with maximum parallelism using fire-and-check pattern.
 Each task gets its own implementer → reviewer cycle.
 Detect and parallelize independent tasks.
 </purpose>
 
-<workflow>
+<background-tools>
+You have access to background task management tools:
+- background_task: Fire a subagent to run in background, returns task_id immediately
+- background_output: Check status or get results from a background task
+- background_list: List all background tasks and their status
+</background-tools>
+
+<workflow pattern="fire-and-check">
 <step>Parse plan to extract individual tasks</step>
 <step>Analyze task dependencies to build execution graph</step>
 <step>Group tasks into parallel batches (independent tasks run together)</step>
-<step>For each batch: spawn implementer → reviewer per task IN PARALLEL</step>
+<step>Fire ALL implementers in batch as background_task</step>
+<step>Poll with background_list, start reviewer immediately when each implementer finishes</step>
 <step>Wait for batch to complete before starting dependent batch</step>
 <step>Aggregate results and report</step>
 </workflow>
@@ -35,83 +43,113 @@ Tasks are DEPENDENT (must be sequential) when:
 When uncertain, assume DEPENDENT (safer).
 </dependency-analysis>
 
-<execution-pattern>
-Example: 9 tasks where tasks 1-3 are independent, 4-6 depend on 1-3, 7-9 depend on 4-6
-
-Batch 1 (parallel):
-  - Spawn implementer for task 1 → reviewer
-  - Spawn implementer for task 2 → reviewer
-  - Spawn implementer for task 3 → reviewer
-  [Wait for all to complete]
-
-Batch 2 (parallel):
-  - Spawn implementer for task 4 → reviewer
-  - Spawn implementer for task 5 → reviewer
-  - Spawn implementer for task 6 → reviewer
-  [Wait for all to complete]
-
-Batch 3 (parallel):
-  - Spawn implementer for task 7 → reviewer
-  - Spawn implementer for task 8 → reviewer
-  - Spawn implementer for task 9 → reviewer
-  [Wait for all to complete]
+<execution-pattern name="fire-and-check">
+The fire-and-check pattern maximizes parallelism by:
+1. Firing all implementers as background tasks simultaneously
+2. Polling to detect completion as early as possible
+3. Starting each reviewer immediately when its implementer finishes
+4. Not waiting for all implementers before starting any reviewers
+
+Example: 3 independent tasks
+- Fire implementer 1, 2, 3 as background_task (all start immediately)
+- Poll with background_list
+- Task 2 finishes first → immediately start reviewer 2
+- Task 1 finishes → immediately start reviewer 1
+- Task 3 finishes → immediately start reviewer 3
+- Reviewers run in parallel as they're spawned
 </execution-pattern>
 
 <available-subagents>
-  <subagent name="implementer" spawn="parallel-per-task">
+  <subagent name="implementer">
     Executes ONE task from the plan.
     Input: Single task with context (which files, what to do).
     Output: Changes made and verification results for that task.
-    Invoke with: Task tool, subagent_type="implementer"
+    <invocation type="background">
+      background_task(description="Implement task 1", prompt="...", agent="implementer")
+    </invocation>
+    <invocation type="fallback">
+      Task(description="Implement task 1", prompt="...", subagent_type="implementer")
+    </invocation>
   </subagent>
-  <subagent name="reviewer" spawn="parallel-per-task">
+  <subagent name="reviewer">
     Reviews ONE task's implementation.
     Input: Single task's changes against its requirements.
     Output: APPROVED or CHANGES REQUESTED for that task.
-    Invoke with: Task tool, subagent_type="reviewer"
+    <invocation type="background">
+      background_task(description="Review task 1", prompt="...", agent="reviewer")
+    </invocation>
+    <invocation type="fallback">
+      Task(description="Review task 1", prompt="...", subagent_type="reviewer")
+    </invocation>
   </subagent>
 </available-subagents>
 
-<critical-instruction>
-You MUST use the Task tool to spawn implementer and reviewer subagents.
-Example: Task(description="Implement task 1", prompt="...", subagent_type="implementer")
-Do NOT try to implement or review yourself - delegate to subagents.
-</critical-instruction>
-
 <per-task-cycle>
 For each task:
-1. Spawn implementer with task details
-2. Wait for implementer to complete
-3. Spawn reviewer to check that task
-4. If reviewer requests changes: re-spawn implementer for fixes
+1. Fire implementer as background_task
+2. Poll until implementer completes
+3. Start reviewer immediately when implementer finishes
+4. If reviewer requests changes: fire new implementer for fixes
 5. Max 3 cycles per task before marking as blocked
 6. Report task status: DONE / BLOCKED
 </per-task-cycle>
 
-<parallel-spawning>
-Within a batch, spawn ALL implementers in a SINGLE message using the Task tool:
-
-Example for batch with tasks 1, 2, 3 - call Task tool 3 times in ONE message:
-- Task(description="Task 1", prompt="Execute task 1: [details]", subagent_type="implementer")
-- Task(description="Task 2", prompt="Execute task 2: [details]", subagent_type="implementer")
-- Task(description="Task 3", prompt="Execute task 3: [details]", subagent_type="implementer")
-
-Then after all complete, in ONE message call Task tool for reviewers:
-- Task(description="Review 1", prompt="Review task 1 implementation", subagent_type="reviewer")
-- Task(description="Review 2", prompt="Review task 2 implementation", subagent_type="reviewer")
-- Task(description="Review 3", prompt="Review task 3 implementation", subagent_type="reviewer")
-</parallel-spawning>
+<fire-and-check-loop>
+Within a batch:
+1. Fire ALL implementers as background_task in ONE message
+2. Enter polling loop:
+   a. Call background_list to check status
+   b. For each newly completed implementer:
+      - Get result with background_output
+      - Start reviewer immediately (as background_task)
+   c. For each newly completed reviewer:
+      - Check if APPROVED or CHANGES REQUESTED
+      - If changes needed and cycles < 3: fire new implementer
+   d. Repeat until all tasks in batch are done or blocked
+3. Move to next batch
+</fire-and-check-loop>
+
+<fallback-rule>
+If background_task fails or is unavailable, fall back to Task() tool:
+- Task(description="...", prompt="...", subagent_type="implementer")
+- Task(description="...", prompt="...", subagent_type="reviewer")
+The Task tool blocks until completion but still works correctly.
+</fallback-rule>
 
 <rules>
 <rule>Parse ALL tasks from plan before starting execution</rule>
 <rule>ALWAYS analyze dependencies before parallelizing</rule>
-<rule>Spawn parallel tasks in SINGLE message for true parallelism</rule>
+<rule>Fire parallel tasks as background_task for true parallelism</rule>
+<rule>Start reviewer immediately when its implementer finishes - don't wait for others</rule>
 <rule>Wait for entire batch before starting next batch</rule>
 <rule>Each task gets its own implement → review cycle</rule>
 <rule>Max 3 review cycles per task</rule>
 <rule>Continue with other tasks if one is blocked</rule>
 </rules>
 
+<execution-example pattern="fire-and-check">
+# Batch with tasks 1, 2, 3 (independent)
+
+## Step 1: Fire all implementers
+background_task(description="Task 1", prompt="Execute task 1: [details]", agent="implementer") → task_id_1
+background_task(description="Task 2", prompt="Execute task 2: [details]", agent="implementer") → task_id_2
+background_task(description="Task 3", prompt="Execute task 3: [details]", agent="implementer") → task_id_3
+
+## Step 2: Poll and react
+background_list() → shows task_id_2 completed
+background_output(task_id=task_id_2) → get result
+background_task(description="Review 2", prompt="Review task 2 implementation", agent="reviewer") → review_id_2
+
+background_list() → shows task_id_1, task_id_3 completed
+background_output(task_id=task_id_1) → get result
+background_output(task_id=task_id_3) → get result
+background_task(description="Review 1", prompt="Review task 1 implementation", agent="reviewer") → review_id_1
+background_task(description="Review 3", prompt="Review task 3 implementation", agent="reviewer") → review_id_3
+
+## Step 3: Continue polling until all reviews complete
+...
+</execution-example>
+
 <output-format>
 <template>
 ## Execution Complete
@@ -151,5 +189,6 @@ Then after all complete, in ONE message call Task tool for reviewers:
 <forbidden>Never skip reviewer for any task</forbidden>
 <forbidden>Never continue past 3 cycles for a single task</forbidden>
 <forbidden>Never report success if any task is blocked</forbidden>
+<forbidden>Never wait for all implementers before starting any reviewer</forbidden>
 </never-do>`,
 };
diff --git a/tests/agents/executor.test.ts b/tests/agents/executor.test.ts
new file mode 100644
index 0000000..6e7db31
--- /dev/null
+++ b/tests/agents/executor.test.ts
@@ -0,0 +1,40 @@
+import { describe, it, expect } from "bun:test";
+
+describe("executor agent", () => {
+  it("should use background_task instead of Task", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/executor.ts", "utf-8");
+
+    expect(source).toContain("background_task");
+    expect(source).toContain("background_output");
+    expect(source).toContain("background_list");
+  });
+
+  it("should have fire-and-check pattern documentation", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/executor.ts", "utf-8");
+
+    expect(source).toContain("fire-and-check");
+  });
+
+  it("should have fallback-rule section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/executor.ts", "utf-8");
+
+    expect(source).toContain("<fallback-rule>");
+  });
+
+  it("should have background-tools section", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/executor.ts", "utf-8");
+
+    expect(source).toContain("<background-tools>");
+  });
+
+  it("should describe starting reviewer when implementer finishes", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/agents/executor.ts", "utf-8");
+
+    expect(source).toMatch(/reviewer.*immediately|immediately.*reviewer/i);
+  });
+});

From 23f96a57ffe508b1eb130ef34b284b8890138658 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Thu, 1 Jan 2026 20:55:19 +0200
Subject: [PATCH 05/14] fix(background-task): add error logging, cleanup,
 response types, and unit tests

- Add error logging to replace silent catch blocks (Task 2)
- Add TTL-based cleanup of finished (non-running) tasks, 1 hour after
  completion, to prevent memory leak (Task 3)
- Add proper response types for API calls (Task 4)
- Add comprehensive unit tests for BackgroundTaskManager (Task 5)
---
 src/tools/background-task/manager.ts          |  57 +++-
 src/tools/background-task/types.ts            |  34 ++
 tests/tools/background-task-cleanup.test.ts   |  23 ++
 .../background-task-error-logging.test.ts     |  23 ++
 tests/tools/background-task-manager.test.ts   | 309 ++++++++++++++++++
 .../background-task-response-types.test.ts    |  30 ++
 6 files changed, 459 insertions(+), 17 deletions(-)
 create mode 100644 tests/tools/background-task-cleanup.test.ts
 create mode 100644 tests/tools/background-task-error-logging.test.ts
 create mode 100644 tests/tools/background-task-manager.test.ts
 create mode 100644 tests/tools/background-task-response-types.test.ts

diff --git a/src/tools/background-task/manager.ts b/src/tools/background-task/manager.ts
index 4ebb987..6461c4a 100644
--- a/src/tools/background-task/manager.ts
+++ b/src/tools/background-task/manager.ts
@@ -1,7 +1,14 @@
 import type { PluginInput } from "@opencode-ai/plugin";
-import type { BackgroundTask, BackgroundTaskInput } from "./types";
+import type {
+  BackgroundTask,
+  BackgroundTaskInput,
+  SessionCreateResponse,
+  SessionGetResponse,
+  SessionMessagesResponse,
+} from "./types";
 
 const POLL_INTERVAL_MS = 2000;
+const TASK_TTL_MS = 60 * 60 * 1000; // 1 hour
 
 function generateTaskId(): string {
   const chars = "abcdefghijklmnopqrstuvwxyz0123456789";
@@ -42,7 +49,7 @@ export class BackgroundTaskManager {
       query: { directory: this.ctx.directory },
     });
 
-    const sessionData = sessionResp as { data?: { id?: string } };
+    const sessionData = sessionResp as SessionCreateResponse;
     const sessionID = sessionData.data?.id;
 
     if (!sessionID) {
@@ -103,7 +110,9 @@ export class BackgroundTaskManager {
           path: { id: task.sessionID },
           query: { directory: this.ctx.directory },
         })
-        .catch(() => {});
+        .catch((error) => {
+          console.error(`[background-task] Failed to abort session ${task.sessionID}:`, error);
+        });
 
       task.status = "cancelled";
       task.completedAt = new Date();
@@ -155,21 +164,17 @@ export class BackgroundTaskManager {
         query: { directory: this.ctx.directory },
       });
 
-      const messages = (resp as { data?: unknown[] }).data || [];
-      const lastAssistant = [...messages].reverse().find((m) => {
-        const msg = m as Record<string, unknown>;
-        const info = msg.info as Record<string, unknown> | undefined;
-        return info?.role === "assistant";
-      }) as Record<string, unknown> | undefined;
+      const messagesResp = resp as SessionMessagesResponse;
+      const messages = messagesResp.data || [];
+      const lastAssistant = [...messages].reverse().find((m) => m.info?.role === "assistant");
 
       if (lastAssistant) {
-        const parts = lastAssistant.parts as Array<{ type: string; text?: string }> | undefined;
-        const textParts = parts?.filter((p) => p.type === "text") || [];
+        const textParts = lastAssistant.parts?.filter((p) => p.type === "text") || [];
         task.result = textParts.map((p) => p.text || "").join("\n");
         return task.result;
       }
-    } catch {
-      // Ignore errors fetching result
+    } catch (error) {
+      console.error(`[background-task] Failed to fetch result for task ${taskId}:`, error);
     }
 
     return undefined;
@@ -215,7 +220,23 @@ export class BackgroundTaskManager {
     }
   }
 
+  private cleanupOldTasks(): void {
+    const now = Date.now();
+    for (const [taskId, task] of this.tasks) {
+      // Only cleanup completed/cancelled/error tasks
+      if (task.status === "running") continue;
+
+      const completedAt = task.completedAt?.getTime() || 0;
+      if (now - completedAt > TASK_TTL_MS) {
+        this.tasks.delete(taskId);
+      }
+    }
+  }
+
   private async pollRunningTasks(): Promise<void> {
+    // Cleanup old completed tasks to prevent memory leak
+    this.cleanupOldTasks();
+
     const runningTasks = this.getRunningTasks();
 
     if (runningTasks.length === 0) {
@@ -231,7 +252,7 @@ export class BackgroundTaskManager {
           query: { directory: this.ctx.directory },
         });
 
-        const sessionData = resp as { data?: { status?: string } };
+        const sessionData = resp as SessionGetResponse;
         const status = sessionData.data?.status;
 
         if (status === "idle") {
@@ -250,10 +271,12 @@ export class BackgroundTaskManager {
                 duration: 5000,
               },
             })
-            .catch(() => {});
+            .catch((error) => {
+              console.error(`[background-task] Failed to show toast for task ${task.id}:`, error);
+            });
         }
-      } catch {
-        // Session may not exist anymore
+      } catch (error) {
+        console.error(`[background-task] Failed to poll task ${task.id}:`, error);
         if (task.status === "running") {
           task.status = "error";
           task.error = "Session lost";
diff --git a/src/tools/background-task/types.ts b/src/tools/background-task/types.ts
index 757865d..91cbc78 100644
--- a/src/tools/background-task/types.ts
+++ b/src/tools/background-task/types.ts
@@ -25,3 +25,37 @@ export interface BackgroundTaskInput {
   parentSessionID: string;
   parentMessageID: string;
 }
+
+// API Response Types
+export interface SessionCreateResponse {
+  data?: {
+    id?: string;
+  };
+}
+
+export interface SessionGetResponse {
+  data?: {
+    status?: "idle" | "running" | "error";
+  };
+}
+
+export interface MessagePart {
+  type: string;
+  text?: string;
+}
+
+export interface MessageInfo {
+  role?: "user" | "assistant";
+  sessionID?: string;
+  type?: string;
+  name?: string;
+}
+
+export interface SessionMessage {
+  info?: MessageInfo;
+  parts?: MessagePart[];
+}
+
+export interface SessionMessagesResponse {
+  data?: SessionMessage[];
+}
diff --git a/tests/tools/background-task-cleanup.test.ts b/tests/tools/background-task-cleanup.test.ts
new file mode 100644
index 0000000..d3d9378
--- /dev/null
+++ b/tests/tools/background-task-cleanup.test.ts
@@ -0,0 +1,23 @@
+import { describe, it, expect } from "bun:test";
+
+describe("background-task cleanup", () => {
+  it("should have TASK_TTL_MS constant", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+    expect(source).toContain("TASK_TTL_MS");
+  });
+
+  it("should have cleanupOldTasks method", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+    expect(source).toContain("cleanupOldTasks");
+  });
+
+  it("should call cleanup in pollRunningTasks", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+    // Find pollRunningTasks method and verify it calls cleanupOldTasks
+    const pollMethod = source.match(/async pollRunningTasks\(\)[^{]*\{[\s\S]*?^\s{2}\}/m);
+    expect(pollMethod?.[0]).toContain("cleanupOldTasks");
+  });
+});
diff --git a/tests/tools/background-task-error-logging.test.ts b/tests/tools/background-task-error-logging.test.ts
new file mode 100644
index 0000000..0788293
--- /dev/null
+++ b/tests/tools/background-task-error-logging.test.ts
@@ -0,0 +1,23 @@
+import { describe, it, expect } from "bun:test";
+
+describe("background-task error logging", () => {
+  it("should not have silent catch blocks", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+
+    // Should not have empty catch blocks
+    expect(source).not.toMatch(/\.catch\s*\(\s*\(\s*\)\s*=>\s*\{\s*\}\s*\)/);
+  });
+
+  it("should log errors in catch blocks", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+
+    // All .catch blocks should have console.error
+    const catchBlocks = source.match(/\.catch\s*\([^)]+\)/g) || [];
+    for (const block of catchBlocks) {
+      // Each catch should capture the error parameter
+      expect(block).toMatch(/\.catch\s*\(\s*\(\s*\w+\s*\)/);
+    }
+  });
+});
diff --git a/tests/tools/background-task-manager.test.ts b/tests/tools/background-task-manager.test.ts
new file mode 100644
index 0000000..9a4206e
--- /dev/null
+++ b/tests/tools/background-task-manager.test.ts
@@ -0,0 +1,309 @@
+import { describe, it, expect, beforeEach, mock } from "bun:test";
+import { BackgroundTaskManager } from "../../src/tools/background-task/manager";
+
+// Mock the PluginInput context
+function createMockCtx() {
+  return {
+    directory: "/test",
+    client: {
+      session: {
+        create: mock(() => Promise.resolve({ data: { id: "session-123" } })),
+        get: mock(() => Promise.resolve({ data: { status: "idle" } })),
+        messages: mock(() =>
+          Promise.resolve({
+            data: [
+              {
+                info: { role: "assistant" },
+                parts: [{ type: "text", text: "Task result" }],
+              },
+            ],
+          }),
+        ),
+        prompt: mock(() => Promise.resolve({})),
+        abort: mock(() => Promise.resolve({})),
+      },
+      tui: {
+        showToast: mock(() => Promise.resolve({})),
+      },
+    },
+  } as any;
+}
+
+describe("BackgroundTaskManager", () => {
+  let manager: BackgroundTaskManager;
+  let mockCtx: ReturnType<typeof createMockCtx>;
+
+  beforeEach(() => {
+    mockCtx = createMockCtx();
+    manager = new BackgroundTaskManager(mockCtx);
+  });
+
+  describe("launch", () => {
+    it("should create a task with running status", async () => {
+      const task = await manager.launch({
+        description: "Test task",
+        prompt: "Do something",
+        agent: "test-agent",
+        parentSessionID: "parent-123",
+        parentMessageID: "msg-123",
+      });
+
+      expect(task.id).toMatch(/^bg_[a-z0-9]{8}$/);
+      expect(task.status).toBe("running");
+      expect(task.description).toBe("Test task");
+      expect(task.agent).toBe("test-agent");
+      expect(task.sessionID).toBe("session-123");
+    });
+
+    it("should throw if session creation fails", async () => {
+      mockCtx.client.session.create = mock(() => Promise.resolve({ data: {} }));
+
+      await expect(
+        manager.launch({
+          description: "Test",
+          prompt: "Test",
+          agent: "test",
+          parentSessionID: "p",
+          parentMessageID: "m",
+        }),
+      ).rejects.toThrow("Failed to create background session");
+    });
+
+    it("should store task in internal map", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      expect(manager.getTask(task.id)).toBe(task);
+    });
+  });
+
+  describe("cancel", () => {
+    it("should cancel a running task", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      const result = await manager.cancel(task.id);
+
+      expect(result).toBe(true);
+      expect(task.status).toBe("cancelled");
+      expect(task.completedAt).toBeDefined();
+    });
+
+    it("should return false for non-existent task", async () => {
+      const result = await manager.cancel("non-existent");
+      expect(result).toBe(false);
+    });
+
+    it("should return false for already completed task", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      task.status = "completed";
+      const result = await manager.cancel(task.id);
+      expect(result).toBe(false);
+    });
+  });
+
+  describe("cancelAll", () => {
+    it("should cancel all running tasks", async () => {
+      await manager.launch({
+        description: "Task 1",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+      await manager.launch({
+        description: "Task 2",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      const cancelled = await manager.cancelAll();
+
+      expect(cancelled).toBe(2);
+      expect(manager.getRunningTasks().length).toBe(0);
+    });
+  });
+
+  describe("getAllTasks", () => {
+    it("should return all tasks", async () => {
+      await manager.launch({
+        description: "Task 1",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+      await manager.launch({
+        description: "Task 2",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      const tasks = manager.getAllTasks();
+      expect(tasks.length).toBe(2);
+    });
+  });
+
+  describe("getRunningTasks", () => {
+    it("should only return running tasks", async () => {
+      const task1 = await manager.launch({
+        description: "Task 1",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+      await manager.launch({
+        description: "Task 2",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      task1.status = "completed";
+
+      const running = manager.getRunningTasks();
+      expect(running.length).toBe(1);
+      expect(running[0].description).toBe("Task 2");
+    });
+  });
+
+  describe("getTaskResult", () => {
+    it("should return undefined for running task", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      const result = await manager.getTaskResult(task.id);
+      expect(result).toBeUndefined();
+    });
+
+    it("should fetch and cache result for completed task", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      task.status = "completed";
+      const result = await manager.getTaskResult(task.id);
+
+      expect(result).toBe("Task result");
+      expect(task.result).toBe("Task result");
+
+      // Second call should use cached result
+      const result2 = await manager.getTaskResult(task.id);
+      expect(result2).toBe("Task result");
+      expect(mockCtx.client.session.messages).toHaveBeenCalledTimes(1);
+    });
+  });
+
+  describe("formatTaskStatus", () => {
+    it("should format task status as markdown table", async () => {
+      const task = await manager.launch({
+        description: "Test task",
+        prompt: "Test",
+        agent: "test-agent",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      const output = manager.formatTaskStatus(task);
+
+      expect(output).toContain("## Task: Test task");
+      expect(output).toContain("| ID |");
+      expect(output).toContain("| Status | RUNNING |");
+      expect(output).toContain("| Agent | test-agent |");
+    });
+
+    it("should include error if present", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      task.status = "error";
+      task.error = "Something went wrong";
+
+      const output = manager.formatTaskStatus(task);
+      expect(output).toContain("### Error");
+      expect(output).toContain("Something went wrong");
+    });
+  });
+
+  describe("handleEvent", () => {
+    it("should track tool usage from message.part.updated events", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      manager.handleEvent({
+        type: "message.part.updated",
+        properties: {
+          info: {
+            sessionID: task.sessionID,
+            type: "tool_use",
+            name: "read",
+          },
+        },
+      });
+
+      expect(task.progress?.toolCalls).toBe(1);
+      expect(task.progress?.lastTool).toBe("read");
+    });
+
+    it("should cancel task on session.deleted event", async () => {
+      const task = await manager.launch({
+        description: "Test",
+        prompt: "Test",
+        agent: "test",
+        parentSessionID: "p",
+        parentMessageID: "m",
+      });
+
+      manager.handleEvent({
+        type: "session.deleted",
+        properties: {
+          info: { id: task.sessionID },
+        },
+      });
+
+      expect(task.status).toBe("cancelled");
+    });
+  });
+});
diff --git a/tests/tools/background-task-response-types.test.ts b/tests/tools/background-task-response-types.test.ts
new file mode 100644
index 0000000..927c579
--- /dev/null
+++ b/tests/tools/background-task-response-types.test.ts
@@ -0,0 +1,30 @@
+import { describe, it, expect } from "bun:test";
+
+describe("background-task response types", () => {
+  it("should have SessionCreateResponse type", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/types.ts", "utf-8");
+    expect(source).toContain("SessionCreateResponse");
+  });
+
+  it("should have SessionGetResponse type", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/types.ts", "utf-8");
+    expect(source).toContain("SessionGetResponse");
+  });
+
+  it("should have SessionMessagesResponse type", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/types.ts", "utf-8");
+    expect(source).toContain("SessionMessagesResponse");
+  });
+
+  it("should use typed responses in manager", async () => {
+    const fs = await import("node:fs/promises");
+    const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
+    // Should import the response types
+    expect(source).toContain("SessionCreateResponse");
+    expect(source).toContain("SessionGetResponse");
+    expect(source).toContain("SessionMessagesResponse");
+  });
+});

From fb720d7dd34905911b86da7e83144a0d8205aed9 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:29:55 +0200
Subject: [PATCH 06/14] fix(background-task): add missing console.error and
 improve test coverage

- Add console.error to prompt session catch block
- Improve test to verify catch block bodies contain console.error
- Test now catches silent catch blocks like .catch((err) => {})
---
 src/tools/background-task/manager.ts          |  1 +
 .../background-task-error-logging.test.ts     | 25 +++++++++++++------
 2 files changed, 19 insertions(+), 7 deletions(-)

diff --git a/src/tools/background-task/manager.ts b/src/tools/background-task/manager.ts
index 6461c4a..1f4a0ab 100644
--- a/src/tools/background-task/manager.ts
+++ b/src/tools/background-task/manager.ts
@@ -85,6 +85,7 @@ export class BackgroundTaskManager {
         query: { directory: this.ctx.directory },
       })
       .catch((error) => {
+        console.error(`[background-task] Failed to prompt session ${sessionID}:`, error);
         task.status = "error";
         task.error = error instanceof Error ? error.message : String(error);
         task.completedAt = new Date();
diff --git a/tests/tools/background-task-error-logging.test.ts b/tests/tools/background-task-error-logging.test.ts
index 0788293..28922a7 100644
--- a/tests/tools/background-task-error-logging.test.ts
+++ b/tests/tools/background-task-error-logging.test.ts
@@ -5,19 +5,30 @@ describe("background-task error logging", () => {
     const fs = await import("node:fs/promises");
     const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
 
-    // Should not have empty catch blocks
+    // Should not have empty catch blocks like .catch(() => {})
     expect(source).not.toMatch(/\.catch\s*\(\s*\(\s*\)\s*=>\s*\{\s*\}\s*\)/);
+
+    // Should not have catch blocks that capture error but do nothing
+    // e.g., .catch((err) => {}) or .catch((error) => {})
+    expect(source).not.toMatch(/\.catch\s*\(\s*\(\s*\w+\s*\)\s*=>\s*\{\s*\}\s*\)/);
   });
 
-  it("should log errors in catch blocks", async () => {
+  it("should log errors in catch blocks with console.error", async () => {
     const fs = await import("node:fs/promises");
     const source = await fs.readFile("src/tools/background-task/manager.ts", "utf-8");
 
-    // All .catch blocks should have console.error
-    const catchBlocks = source.match(/\.catch\s*\([^)]+\)/g) || [];
-    for (const block of catchBlocks) {
-      // Each catch should capture the error parameter
-      expect(block).toMatch(/\.catch\s*\(\s*\(\s*\w+\s*\)/);
+    // Find all .catch blocks with their full body using a more comprehensive regex
+    // Match .catch((param) => { ... }) including multiline
+    const catchRegex = /\.catch\s*\(\s*\(\s*(\w+)\s*\)\s*=>\s*\{([^}]*(?:\{[^}]*\}[^}]*)*)\}\s*\)/g;
+    const matches = [...source.matchAll(catchRegex)];
+
+    // Should have at least some catch blocks
+    expect(matches.length).toBeGreaterThan(0);
+
+    for (const match of matches) {
+      const catchBody = match[2];
+      // Each catch block body should contain console.error
+      expect(catchBody).toContain("console.error");
     }
   });
 });

From 32131a7d5cf33b5f1a493027d162b6fcd491034e Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:31:07 +0200
Subject: [PATCH 07/14] fix(background-task): re-fetch task status in blocking
 poll loop

The blocking wait loop was checking a stale task object instead of
re-fetching the current status, causing block=true calls to hang for the
full timeout (up to 600s) instead of returning when the task finished.
---
 src/tools/background-task/tools.ts | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/src/tools/background-task/tools.ts b/src/tools/background-task/tools.ts
index 68677e5..b63a330 100644
--- a/src/tools/background-task/tools.ts
+++ b/src/tools/background-task/tools.ts
@@ -59,16 +59,27 @@ Set block=true to wait for completion (with timeout).`,
         const maxWait = Math.min(timeout || 60, 600) * 1000;
         const startTime = Date.now();
 
-        while (task.status === "running" && Date.now() - startTime < maxWait) {
+        while (Date.now() - startTime < maxWait) {
+          // Re-fetch task to get updated status
+          const currentTask = manager.getTask(task_id);
+          if (!currentTask || currentTask.status !== "running") {
+            break;
+          }
           await new Promise((resolve) => setTimeout(resolve, 1000));
         }
       }
 
+      // Re-fetch task for final status
+      const finalTask = manager.getTask(task_id);
+      if (!finalTask) {
+        return `Task not found: ${task_id}`;
+      }
+
       // Format status
-      let output = manager.formatTaskStatus(task);
+      let output = manager.formatTaskStatus(finalTask);
 
       // Include result if completed
-      if (task.status === "completed") {
+      if (finalTask.status === "completed") {
         const result = await manager.getTaskResult(task_id);
         if (result) {
           output += `\n### Result\n${result}\n`;

From 655e491f9ec8271931e9ead6f71438ea1dacecf7 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:39:07 +0200
Subject: [PATCH 08/14] chore: pin @opencode-ai/plugin to exact version 1.0.223

---
 bun.lock     | 6 +++---
 package.json | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/bun.lock b/bun.lock
index 6cef8ca..491d85b 100644
--- a/bun.lock
+++ b/bun.lock
@@ -5,7 +5,7 @@
     "": {
       "name": "@vtemian/opencode-config",
       "dependencies": {
-        "@opencode-ai/plugin": "^1.0.219",
+        "@opencode-ai/plugin": "1.0.223",
       },
       "devDependencies": {
         "@biomejs/biome": "^2.3.10",
@@ -33,9 +33,9 @@
 
     "@biomejs/cli-win32-x64": ["@biomejs/cli-win32-x64@2.3.10", "", { "os": "win32", "cpu": "x64" }, "sha512-pHEFgq7dUEsKnqG9mx9bXihxGI49X+ar+UBrEIj3Wqj3UCZp1rNgV+OoyjFgcXsjCWpuEAF4VJdkZr3TrWdCbQ=="],
 
-    "@opencode-ai/plugin": ["@opencode-ai/plugin@1.0.219", "", { "dependencies": { "@opencode-ai/sdk": "1.0.219", "zod": "4.1.8" } }, "sha512-acyaJd/LuSo/h2RFP8sXX89KZ4aLGjqPJVRkA47ccQGDMcwAzjK9JPJOrmNPzykDWQLVCX66bKKO1Equ82VVvQ=="],
+    "@opencode-ai/plugin": ["@opencode-ai/plugin@1.0.223", "", { "dependencies": { "@opencode-ai/sdk": "1.0.223", "zod": "4.1.8" } }, "sha512-ZQAB7woEWHTpDlZrr+WYwIFI/QrmPblGk1nYLRObtpdMFoP8e2zLwE61j0IL4eBrgWY23+Xc2MrALZnkWL4O2Q=="],
 
-    "@opencode-ai/sdk": ["@opencode-ai/sdk@1.0.219", "", {}, "sha512-thbbQsNhkR4M7hKXy1YK+ekMa6rnuDNNqFt1fCjf3zx7h/DLkoI8ll1MDw/Do/cSzcYuTgVCMV1H+lLDQN0I6A=="],
+    "@opencode-ai/sdk": ["@opencode-ai/sdk@1.0.223", "", {}, "sha512-oKJ6QjsviE+lt6cpGu0lL2kWuoj84ZkWvwieyqHEQ2pJunAJqUzhmIhzep0QyDax1/+UXhBWfrnciNt48ch66w=="],
 
     "@types/node": ["@types/node@25.0.3", "", { "dependencies": { "undici-types": "~7.16.0" } }, "sha512-W609buLVRVmeW693xKfzHeIV6nJGGz98uCPfeXI1ELMLXVeKYZ9m15fAMSaUPBHYLGFsVRcMmSCksQOrZV9BYA=="],
 
diff --git a/package.json b/package.json
index ccf222f..7a6176b 100644
--- a/package.json
+++ b/package.json
@@ -44,7 +44,7 @@
     "url": "https://github.com/vtemian/micode/issues"
   },
   "dependencies": {
-    "@opencode-ai/plugin": "^1.0.219"
+    "@opencode-ai/plugin": "1.0.223"
   },
   "devDependencies": {
     "@biomejs/biome": "^2.3.10",

From 5954beefe50d2bd95363266bb1a1400420fddc6b Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:41:22 +0200
Subject: [PATCH 09/14] chore: update @opencode-ai/plugin to 1.0.224

---
 bun.lock     | 6 +++---
 package.json | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/bun.lock b/bun.lock
index 491d85b..8b80a7b 100644
--- a/bun.lock
+++ b/bun.lock
@@ -5,7 +5,7 @@
     "": {
       "name": "@vtemian/opencode-config",
       "dependencies": {
-        "@opencode-ai/plugin": "1.0.223",
+        "@opencode-ai/plugin": "^1.0.224",
       },
       "devDependencies": {
         "@biomejs/biome": "^2.3.10",
@@ -33,9 +33,9 @@
 
     "@biomejs/cli-win32-x64": ["@biomejs/cli-win32-x64@2.3.10", "", { "os": "win32", "cpu": "x64" }, "sha512-pHEFgq7dUEsKnqG9mx9bXihxGI49X+ar+UBrEIj3Wqj3UCZp1rNgV+OoyjFgcXsjCWpuEAF4VJdkZr3TrWdCbQ=="],
 
-    "@opencode-ai/plugin": ["@opencode-ai/plugin@1.0.223", "", { "dependencies": { "@opencode-ai/sdk": "1.0.223", "zod": "4.1.8" } }, "sha512-ZQAB7woEWHTpDlZrr+WYwIFI/QrmPblGk1nYLRObtpdMFoP8e2zLwE61j0IL4eBrgWY23+Xc2MrALZnkWL4O2Q=="],
+    "@opencode-ai/plugin": ["@opencode-ai/plugin@1.0.224", "", { "dependencies": { "@opencode-ai/sdk": "1.0.224", "zod": "4.1.8" } }, "sha512-V2Su55FI6NGyabFHo853+8r9h66q//gsYWCIODbwRs47qi4VfbFylfddJxQDD+/M/H7w0++ojbQC9YCLNDXdKw=="],
 
-    "@opencode-ai/sdk": ["@opencode-ai/sdk@1.0.223", "", {}, "sha512-oKJ6QjsviE+lt6cpGu0lL2kWuoj84ZkWvwieyqHEQ2pJunAJqUzhmIhzep0QyDax1/+UXhBWfrnciNt48ch66w=="],
+    "@opencode-ai/sdk": ["@opencode-ai/sdk@1.0.224", "", {}, "sha512-gODyWLDTaz38qISxRdJKsEiFqvJNcFzu4/awoSICIl8j8gx6qDxLsYWVp/ToO4LKXTvHMn8yyZpM3ZEdGhDC+g=="],
 
     "@types/node": ["@types/node@25.0.3", "", { "dependencies": { "undici-types": "~7.16.0" } }, "sha512-W609buLVRVmeW693xKfzHeIV6nJGGz98uCPfeXI1ELMLXVeKYZ9m15fAMSaUPBHYLGFsVRcMmSCksQOrZV9BYA=="],
 
diff --git a/package.json b/package.json
index 7a6176b..d29a377 100644
--- a/package.json
+++ b/package.json
@@ -44,7 +44,7 @@
     "url": "https://github.com/vtemian/micode/issues"
   },
   "dependencies": {
-    "@opencode-ai/plugin": "1.0.223"
+    "@opencode-ai/plugin": "^1.0.224"
   },
   "devDependencies": {
     "@biomejs/biome": "^2.3.10",

From 8c4829ff14626dae688ea548e4ff62e0ebb91d31 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:46:51 +0200
Subject: [PATCH 10/14] refactor(background-task): remove block parameter, use
 polling pattern

- Remove block and timeout params from background_output tool
- Update executor, planner, project-initializer to use polling pattern
- Poll with background_list, then collect with background_output
- Simpler, more visible, no hanging
---
 src/agents/executor.ts             | 19 ++++++++------
 src/agents/planner.ts              | 19 ++++++++------
 src/agents/project-initializer.ts  | 40 ++++++++++++++++--------------
 src/tools/background-task/tools.ts | 34 ++++---------------------
 4 files changed, 49 insertions(+), 63 deletions(-)

diff --git a/src/agents/executor.ts b/src/agents/executor.ts
index c5e0f97..fff1ff0 100644
--- a/src/agents/executor.ts
+++ b/src/agents/executor.ts
@@ -98,15 +98,17 @@ For each task:
 Within a batch:
 1. Fire ALL implementers as background_task in ONE message
 2. Enter polling loop:
-   a. Call background_list to check status
-   b. For each newly completed implementer:
-      - Get result with background_output
-      - Start reviewer immediately (as background_task)
-   c. For each newly completed reviewer:
-      - Check if APPROVED or CHANGES REQUESTED
-      - If changes needed and cycles < 3: fire new implementer
-   d. Repeat until all tasks in batch are done or blocked
+   a. Call background_list to check status of ALL tasks
+   b. For each newly completed task (status != "running"):
+      - Get result with background_output (task is already done)
+      - If implementer completed: start its reviewer as background_task
+      - If reviewer completed: check APPROVED or CHANGES REQUESTED
+   c. If changes needed and cycles < 3: fire new implementer
+   d. Sleep briefly, then repeat until all tasks done or blocked
 3. Move to next batch
+
+IMPORTANT: Always poll with background_list first to check status,
+then fetch results with background_output only for completed tasks.
 </fire-and-check-loop>
 
 <fallback-rule>
@@ -184,6 +186,7 @@ background_task(description="Review 3", prompt="Review task 3 implementation", a
 </output-format>
 
 <never-do>
+<forbidden>NEVER call background_output on running tasks - always poll with background_list first</forbidden>
 <forbidden>Never skip dependency analysis</forbidden>
 <forbidden>Never spawn dependent tasks in parallel</forbidden>
 <forbidden>Never skip reviewer for any task</forbidden>
diff --git a/src/agents/planner.ts b/src/agents/planner.ts
index de0a400..3c767d0 100644
--- a/src/agents/planner.ts
+++ b/src/agents/planner.ts
@@ -22,8 +22,8 @@ Every task is bite-sized (2-5 minutes), with exact paths and complete code.
 
 <background-tools>
   <tool name="background_task">Fire subagent tasks that run in parallel. Returns task_id immediately.</tool>
-  <tool name="background_output">Collect results from background tasks. Use block=true to wait for completion.</tool>
-  <tool name="background_list">List all background tasks and their status.</tool>
+  <tool name="background_list">List all background tasks and their current status. Use to poll for completion.</tool>
+  <tool name="background_output">Get results from a completed task. Only call after background_list shows task is done.</tool>
 </background-tools>
 
 <fallback-rule>
@@ -86,8 +86,9 @@ All research must serve the design - never second-guess design decisions.
     - context7_resolve-library-id + context7_query-docs for API docs
     - btca_ask for library internals when needed
   </fire-phase>
-  <collect-phase description="Wait for all results">
-    - background_output(task_id=..., block=true) for each background task
+  <collect-phase description="Poll until all complete, then collect">
+    - Poll with background_list until all tasks show completed
+    - Call background_output(task_id=...) for each completed task
     - Combine all results for planning phase
   </collect-phase>
   <rule>Only research what's needed to implement the design</rule>
@@ -191,10 +192,12 @@ context7_resolve-library-id(libraryName="express")  // runs in parallel
 btca_ask(tech="express", question="middleware chain order")  // runs in parallel
 </step>
 <step name="collect">
-// Wait for all background tasks to complete:
-background_output(task_id=task_id_1, block=true)  // blocks until complete
-background_output(task_id=task_id_2, block=true)
-background_output(task_id=task_id_3, block=true)
+// Poll until all background tasks complete:
+background_list()  // check status of all tasks
+// When all show "completed" or "error" (skip errored tasks):
+background_output(task_id=task_id_1)  // get result
+background_output(task_id=task_id_2)  // get result
+background_output(task_id=task_id_3)  // get result
 // context7 and btca_ask results already available from fire step
 </step>
 <step name="plan">
diff --git a/src/agents/project-initializer.ts b/src/agents/project-initializer.ts
index 9da543a..8e475a5 100644
--- a/src/agents/project-initializer.ts
+++ b/src/agents/project-initializer.ts
@@ -29,15 +29,15 @@ const PROMPT = `
       Parameters: description, prompt, agent (subagent type)
       Example: background_task(description="Find entry points", prompt="Find all entry points", agent="codebase-locator")
     </tool>
-    <tool name="background_output">
-      Get results from a background task. Use block=true to wait for completion.
-      Parameters: task_id, block (boolean), timeout (optional)
-      Example: background_output(task_id="abc123", block=true)
-    </tool>
     <tool name="background_list">
-      List all background tasks and their status.
+      List all background tasks and their status. Use to poll for completion.
       No parameters required.
     </tool>
+    <tool name="background_output">
+      Get results from a completed task. Only call after background_list shows task is done.
+      Parameters: task_id
+      Example: background_output(task_id="abc123")
+    </tool>
   </background-tools>
 
   <parallel-execution-strategy pattern="fire-and-collect">
@@ -58,9 +58,10 @@ const PROMPT = `
       </parallel-tools>
     </phase>
 
-    <phase name="2-collect" description="Collect all results">
-      <description>Use background_output(block=true) to collect each result</description>
-      <action>Collect results from all fired agents</action>
+    <phase name="2-collect" description="Poll and collect all results">
+      <description>Poll background_list until all tasks complete, then collect with background_output</description>
+      <action>Poll background_list until all tasks show "completed"</action>
+      <action>Call background_output for each completed task</action>
       <action>Process tool results from phase 1</action>
     </phase>
 
@@ -118,8 +119,9 @@ const PROMPT = `
 
   <critical-instruction>
     Use background_task to fire subagents for TRUE parallelism.
-    Fire ALL background_task calls in a SINGLE message, then collect with background_output(block=true).
-    This is the fire-and-collect pattern - fire everything, then collect everything.
+    Fire ALL background_task calls in a SINGLE message.
+    Then poll with background_list until all complete, and collect with background_output.
+    This is the fire-and-collect pattern - fire everything, poll, then collect everything.
   </critical-instruction>
 
   <language-detection>
@@ -225,13 +227,15 @@ const PROMPT = `
       - Glob: README*, ARCHITECTURE*, docs/*
     </step>
 
-    <step description="COLLECT: Gather all results">
-      In a SINGLE message, collect ALL results:
-      - background_output(task_id=task_id_1, block=true)
-      - background_output(task_id=task_id_2, block=true)
-      - background_output(task_id=task_id_3, block=true)
-      - background_output(task_id=task_id_4, block=true)
-      - background_output(task_id=task_id_5, block=true)
+    <step description="COLLECT: Poll and gather all results">
+      First poll until all tasks complete:
+      - background_list()  // repeat until all show "completed"
+      Then collect ALL results:
+      - background_output(task_id=task_id_1)
+      - background_output(task_id=task_id_2)
+      - background_output(task_id=task_id_3)
+      - background_output(task_id=task_id_4)
+      - background_output(task_id=task_id_5)
     </step>
 
     <step description="FIRE: Deep analysis based on discovery">
diff --git a/src/tools/background-task/tools.ts b/src/tools/background-task/tools.ts
index b63a330..41f3c30 100644
--- a/src/tools/background-task/tools.ts
+++ b/src/tools/background-task/tools.ts
@@ -38,48 +38,24 @@ Use \`background_output\` with task_id="${task.id}" to check progress or get res
   });
 
   const background_output = tool({
-    description: `Check status or get results from a background task.
-By default returns immediately with current status.
-Set block=true to wait for completion (with timeout).`,
+    description: `Get status or results from a background task.
+Returns immediately with current status. Use background_list to poll for completion.`,
     args: {
       task_id: tool.schema.string().describe("ID of the task to check (e.g., 'bg_abc12345')"),
-      block: tool.schema.boolean().optional().describe("Wait for task completion (default: false)"),
-      timeout: tool.schema.number().optional().describe("Max seconds to wait if blocking (default: 60, max: 600)"),
     },
     execute: async (args) => {
-      const { task_id, block = false, timeout = 60 } = args;
+      const { task_id } = args;
 
       const task = manager.getTask(task_id);
       if (!task) {
         return `Task not found: ${task_id}`;
       }
 
-      // If blocking, wait for completion
-      if (block && task.status === "running") {
-        const maxWait = Math.min(timeout || 60, 600) * 1000;
-        const startTime = Date.now();
-
-        while (Date.now() - startTime < maxWait) {
-          // Re-fetch task to get updated status
-          const currentTask = manager.getTask(task_id);
-          if (!currentTask || currentTask.status !== "running") {
-            break;
-          }
-          await new Promise((resolve) => setTimeout(resolve, 1000));
-        }
-      }
-
-      // Re-fetch task for final status
-      const finalTask = manager.getTask(task_id);
-      if (!finalTask) {
-        return `Task not found: ${task_id}`;
-      }
-
       // Format status
-      let output = manager.formatTaskStatus(finalTask);
+      let output = manager.formatTaskStatus(task);
 
       // Include result if completed
-      if (finalTask.status === "completed") {
+      if (task.status === "completed") {
         const result = await manager.getTaskResult(task_id);
         if (result) {
           output += `\n### Result\n${result}\n`;

From 40f8a848258b5fc4ac759e64ab09b2dc6d3678ea Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:52:34 +0200
Subject: [PATCH 11/14] feat(brainstormer): use background_task for parallel
 research and auto-handoff to planner

- Use background_task instead of Task for parallel codebase research
- Fire-poll-collect pattern matches planner and executor
- Auto-spawn planner when user approves design (no extra confirmation)
- Add handoff phase for smooth transition to planning
---
 src/agents/brainstormer.ts | 71 +++++++++++++++++++++++++++-----------
 1 file changed, 50 insertions(+), 21 deletions(-)

diff --git a/src/agents/brainstormer.ts b/src/agents/brainstormer.ts
index 79bb0a5..b19343f 100644
--- a/src/agents/brainstormer.ts
+++ b/src/agents/brainstormer.ts
@@ -13,34 +13,50 @@ This is DESIGN ONLY. The planner agent handles detailed implementation plans.
 <critical-rules>
   <rule priority="HIGHEST">ONE QUESTION AT A TIME: Ask exactly ONE question, then STOP and wait for the user's response. NEVER ask multiple questions in a single message. This is the most important rule.</rule>
   <rule>NO CODE: Never write code. Never provide code examples. Design only.</rule>
-  <rule>SUBAGENTS: Spawn multiple in parallel for codebase analysis.</rule>
-  <rule>TOOLS (grep, read, etc.): Do NOT use directly - use subagents instead.</rule>
+  <rule>BACKGROUND TASKS: Use background_task for parallel codebase analysis.</rule>
+  <rule>TOOLS (grep, read, etc.): Do NOT use directly - use background subagents instead.</rule>
 </critical-rules>
 
+<background-tools>
+  <tool name="background_task">Fire subagent tasks that run in parallel. Returns task_id immediately.</tool>
+  <tool name="background_list">List all background tasks and their current status. Use to poll for completion.</tool>
+  <tool name="background_output">Get results from a completed task. Only call after background_list shows task is done.</tool>
+</background-tools>
+
 <available-subagents>
-  <subagent name="codebase-locator" spawn="parallel">
-    Find files, modules, patterns. Spawn multiple with different queries.
-    Examples: "Find authentication code", "Find API routes", "Find config files"
+  <subagent name="codebase-locator" spawn="background_task">
+    Find files, modules, patterns. Fire multiple with different queries.
+    Example: background_task(agent="codebase-locator", prompt="Find authentication code", description="Find auth files")
+  </subagent>
+  <subagent name="codebase-analyzer" spawn="background_task">
+    Deep analysis of specific modules. Fire multiple for different areas.
+    Example: background_task(agent="codebase-analyzer", prompt="Analyze the auth module", description="Analyze auth")
   </subagent>
-  <subagent name="codebase-analyzer" spawn="parallel">
-    Deep analysis of specific modules. Spawn multiple for different areas.
-    Examples: "Analyze the auth module", "Explain the data layer"
+  <subagent name="pattern-finder" spawn="background_task">
+    Find existing patterns in codebase. Fire for different pattern types.
+    Example: background_task(agent="pattern-finder", prompt="Find error handling patterns", description="Find error patterns")
   </subagent>
-  <subagent name="pattern-finder" spawn="parallel">
-    Find existing patterns in codebase. Spawn for different pattern types.
-    Examples: "Find error handling patterns", "Find how similar features are implemented"
+  <subagent name="planner" spawn="Task" when="design approved">
+    Creates detailed implementation plan from validated design.
+    Example: Task(subagent_type="planner", prompt="Create implementation plan for [design path]", description="Create plan")
   </subagent>
 </available-subagents>
 
 <process>
-<phase name="understanding">
-  <action>Spawn subagents in PARALLEL to gather context:</action>
-  <spawn-example>
-    In a SINGLE message, spawn:
-    - codebase-locator: "Find files related to [topic]"
-    - codebase-analyzer: "Analyze existing [related feature]"
-    - pattern-finder: "Find patterns for [similar functionality]"
-  </spawn-example>
+<phase name="understanding" pattern="fire-poll-collect">
+  <action>Fire background tasks in PARALLEL to gather context:</action>
+  <fire-example>
+    In a SINGLE message, fire ALL background tasks:
+    background_task(agent="codebase-locator", prompt="Find files related to [topic]", description="Find [topic] files")
+    background_task(agent="codebase-analyzer", prompt="Analyze existing [related feature]", description="Analyze [feature]")
+    background_task(agent="pattern-finder", prompt="Find patterns for [similar functionality]", description="Find patterns")
+  </fire-example>
+  <poll>
+    background_list()  // repeat until all show "completed"
+  </poll>
+  <collect>
+    background_output(task_id=...) for each completed task
+  </collect>
   <focus>purpose, constraints, success criteria</focus>
 </phase>
 
@@ -70,16 +86,29 @@ This is DESIGN ONLY. The planner agent handles detailed implementation plans.
   <action>Commit the design document to git</action>
   <action>Ask: "Ready for the planner to create a detailed implementation plan?"</action>
 </phase>
+
+<phase name="handoff" trigger="user approves design">
+  <action>When user says yes/approved/ready, IMMEDIATELY spawn the planner:</action>
+  <spawn>
+    Task(
+      subagent_type="planner",
+      prompt="Create a detailed implementation plan based on the design at thoughts/shared/designs/YYYY-MM-DD-{topic}-design.md",
+      description="Create implementation plan"
+    )
+  </spawn>
+  <rule>Do NOT ask again - if user approved, spawn planner immediately</rule>
+</phase>
 </process>
 
 <principles>
   <principle name="design-only">NO CODE. Describe components, not implementations. Planner writes code.</principle>
-  <principle name="subagents-first">ALWAYS use subagents for code analysis, NEVER tools directly</principle>
-  <principle name="parallel-spawn">Spawn multiple subagents in a SINGLE message</principle>
+  <principle name="background-tasks">Use background_task for parallel research, poll with background_list, collect with background_output</principle>
+  <principle name="parallel-fire">Fire ALL background tasks in a SINGLE message for true parallelism</principle>
   <principle name="one-question">Ask exactly ONE question per message. STOP after asking. Wait for user's answer before continuing. NEVER bundle multiple questions together.</principle>
   <principle name="yagni">Remove unnecessary features from ALL designs</principle>
   <principle name="explore-alternatives">ALWAYS propose 2-3 approaches before settling</principle>
   <principle name="incremental-validation">Present in sections, validate each before proceeding</principle>
+  <principle name="auto-handoff">When user approves design, IMMEDIATELY spawn planner - don't ask again</principle>
 </principles>
 
 <never-do>

From 2dd6ebf81fab6c408d01eb15a543d768cd07742c Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Fri, 2 Jan 2026 17:54:37 +0200
Subject: [PATCH 12/14] feat(implementer): add commit step after successful
 verification

- Commit after tests/types pass
- Use commit message from plan
- Stage only task-related files
- Do not push (executor handles that)
---
 src/agents/implementer.ts | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/src/agents/implementer.ts b/src/agents/implementer.ts
index 64c75f0..ebd527a 100644
--- a/src/agents/implementer.ts
+++ b/src/agents/implementer.ts
@@ -27,6 +27,7 @@ Execute the plan. Write code. Verify.
 <step>Verify preconditions match plan</step>
 <step>Make the changes</step>
 <step>Run verification (tests, lint, build)</step>
+<step>If verification passes: commit with message from plan</step>
 <step>Report results</step>
 </process>
 
@@ -40,8 +41,17 @@ Execute the plan. Write code. Verify.
 <check>Run tests if available</check>
 <check>Check for type errors</check>
 <check>Verify no regressions</check>
+<check>If all pass: git add and commit with plan's commit message</check>
 </after-each-change>
 
+<commit-rules>
+<rule>Commit ONLY after verification passes</rule>
+<rule>Use the commit message from the plan (e.g., "feat(scope): description")</rule>
+<rule>Stage only the files mentioned in the task</rule>
+<rule>If plan doesn't specify commit message, use: "feat(task): [task description]"</rule>
+<rule>Do NOT push - just commit locally</rule>
+</commit-rules>
+
 <output-format>
 <template>
 ## Task: [Description]
@@ -54,6 +64,8 @@ Execute the plan. Write code. Verify.
 - [x] Types check
 - [ ] Manual check needed: [what]
 
+**Commit**: \`[commit hash]\` - [commit message]
+
 **Issues**: None / [description]
 </template>
 </output-format>

From d6b0b50fde3f1485358291f6c4a12e607c06fbf4 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Sat, 3 Jan 2026 14:41:35 +0200
Subject: [PATCH 13/14] docs: update README with background task changes

- Brainstormer: uses background_task, auto-handoff to planner
- Planner: library research tools (context7, btca_ask)
- Executor: fire-and-check pattern with polling
- Implementer: commits after verification
- Tools: add btca_ask, document fire-poll-collect pattern
---
 README.md | 86 +++++++++++++++++++++++++++++++++++++++++--------------
 1 file changed, 64 insertions(+), 22 deletions(-)

diff --git a/README.md b/README.md
index 6d2adcf..222290f 100644
--- a/README.md
+++ b/README.md
@@ -45,13 +45,14 @@ Research subagents (codebase-locator, codebase-analyzer, pattern-finder) are spa
 
 Refine rough ideas into fully-formed designs through collaborative questioning.
 
-- One question at a time
+- One question at a time (critical rule!)
 - 2-3 approaches with trade-offs
 - Section-by-section validation
-- Spawns research subagents to understand codebase
+- Fires research subagents in parallel via `background_task`
+- Auto-hands off to planner when user approves
 - Output: `thoughts/shared/designs/YYYY-MM-DD-{topic}-design.md`
 
-**Research subagents** (spawned in parallel):
+**Research subagents** (fired in parallel via background_task):
 
 | Subagent | Purpose |
 |----------|---------|
@@ -59,17 +60,27 @@ Refine rough ideas into fully-formed designs through collaborative questioning.
 | `codebase-analyzer` | Explain HOW code works (with file:line refs) |
 | `pattern-finder` | Find existing patterns to follow |
 
+**Auto-handoff:** When user approves the design, brainstormer automatically spawns the planner - no extra confirmation needed.
+
 ### 2. Plan
 
 Transform validated designs into comprehensive implementation plans.
 
-- Spawns research subagents for exact paths, signatures, patterns
+- Fires research subagents in parallel via `background_task`
+- Uses `context7` and `btca_ask` for external library documentation
 - Bite-sized tasks (2-5 minutes each)
 - Exact file paths, complete code examples
 - TDD workflow: failing test → verify fail → implement → verify pass → commit
 - Get human approval before implementing
 - Output: `thoughts/shared/plans/YYYY-MM-DD-{topic}.md`
 
+**Library research tools:**
+
+| Tool | Purpose |
+|------|---------|
+| `context7` | Documentation lookup for external libraries |
+| `btca_ask` | Source code search for library internals |
+
 ### 3. Implement
 
 Execute plan in git worktree for isolation:
@@ -104,34 +115,47 @@ Dependent tasks (must be sequential):
 - Task B's test relies on Task A's implementation
 ```
 
-#### Parallel Execution
+#### Parallel Execution (Fire-and-Check Pattern)
+
+The executor uses a **fire-and-check** pattern for maximum parallelism:
 
-Within a batch, all tasks run concurrently by spawning multiple subagents in a single message:
+1. **Fire** - Launch all implementers as `background_task` in ONE message
+2. **Poll** - Check `background_list` for completions
+3. **React** - Start reviewer immediately when each implementer finishes
+4. **Repeat** - Continue polling until batch complete
 
 ```
 Plan with 6 tasks:
 ├── Batch 1 (parallel): Tasks 1, 2, 3 → independent, different files
-│   ├── implementer: task 1 ─┐
-│   ├── implementer: task 2 ─┼─ spawn in ONE message
-│   └── implementer: task 3 ─┘
-│   [wait for all]
-│   ├── reviewer: task 1 ─┐
-│   ├── reviewer: task 2 ─┼─ spawn in ONE message
-│   └── reviewer: task 3 ─┘
-│   [wait for all]
+│   │
+│   │ FIRE: background_task(agent="implementer") x3
+│   │
+│   │ POLL: background_list() → task 2 completed!
+│   │ → background_output(task_id=task_2)
+│   │ → background_task(agent="reviewer", prompt="Review task 2")
+│   │
+│   │ POLL: background_list() → tasks 1, 3 completed!
+│   │ → start reviewers for 1 and 3
+│   │
+│   │ [continue until all reviewed]
 │
 └── Batch 2 (parallel): Tasks 4, 5, 6 → depend on batch 1
     └── [same pattern]
 ```
 
+Key: Reviewers start **immediately** when their implementer finishes - no waiting for the whole batch.
+
 #### Per-Task Cycle
 
 Each task gets its own implement→review loop:
 
-1. Spawn implementer with task details
-2. Spawn reviewer to check implementation
-3. If changes requested → re-spawn implementer (max 3 cycles)
-4. Mark as DONE or BLOCKED
+1. Fire implementer via `background_task`
+2. Implementer: make changes → run tests → **commit** if passing
+3. Fire reviewer to check implementation
+4. If changes requested → fire new implementer (max 3 cycles)
+5. Mark as DONE or BLOCKED
+
+**Note:** Implementer commits after verification passes, using the commit message from the plan.
 
 ### 4. Session Continuity
 
@@ -233,10 +257,28 @@ Searches across:
 | `ast_grep_replace` | AST-aware code pattern replacement |
 | `look_at` | Extract file structure for large files |
 | `artifact_search` | Search past plans and ledgers |
-| `background_task` | Run long-running tasks in background |
-| `background_output` | Check background task status/output |
-| `background_cancel` | Cancel background tasks |
-| `background_list` | List all background tasks |
+| `btca_ask` | Query library source code (requires btca CLI) |
+| `background_task` | Fire subagent to run in background, returns task_id |
+| `background_list` | List all tasks and status (use to poll for completion) |
+| `background_output` | Get results from completed task |
+| `background_cancel` | Cancel running task(s) |
+
+### Background Task Pattern
+
+All agents use the **fire-poll-collect** pattern for parallel work:
+
+```
+# FIRE: Launch all in ONE message
+task_1 = background_task(agent="locator", prompt="...")
+task_2 = background_task(agent="analyzer", prompt="...")
+
+# POLL: Check until complete
+background_list()  # repeat until all show "completed"
+
+# COLLECT: Get results
+background_output(task_id=task_1)
+background_output(task_id=task_2)
+```
 
 ## Hooks
 

From ea234f78585138d2bc6d2ad8423d5fcbfc8e0bc3 Mon Sep 17 00:00:00 2001
From: Vlad Temian <vladtemian@gmail.com>
Date: Sat, 3 Jan 2026 14:51:23 +0200
Subject: [PATCH 14/14] fix: handle error status in polling and fix README
 accuracy

- Poll until tasks show 'completed' or 'error' (not just completed)
- Skip errored tasks when collecting results
- Fix README: clarify which agents use which pattern
---
 README.md                         | 6 +++---
 src/agents/brainstormer.ts        | 4 ++--
 src/agents/planner.ts             | 4 ++--
 src/agents/project-initializer.ts | 8 ++++----
 4 files changed, 11 insertions(+), 11 deletions(-)

diff --git a/README.md b/README.md
index 222290f..3fc2806 100644
--- a/README.md
+++ b/README.md
@@ -265,7 +265,7 @@ Searches across:
 
 ### Background Task Pattern
 
-All agents use the **fire-poll-collect** pattern for parallel work:
+Research agents (brainstormer, planner, project-initializer) use the **fire-poll-collect** pattern. Executor uses **fire-and-check** (starts reviewers as implementers complete).
 
 ```
 # FIRE: Launch all in ONE message
@@ -273,9 +273,9 @@ task_1 = background_task(agent="locator", prompt="...")
 task_2 = background_task(agent="analyzer", prompt="...")
 
 # POLL: Check until complete
-background_list()  # repeat until all show "completed"
+background_list()  # repeat until all show "completed" or "error"
 
-# COLLECT: Get results
+# COLLECT: Get results (skip errored tasks)
 background_output(task_id=task_1)
 background_output(task_id=task_2)
 ```
diff --git a/src/agents/brainstormer.ts b/src/agents/brainstormer.ts
index b19343f..22d560f 100644
--- a/src/agents/brainstormer.ts
+++ b/src/agents/brainstormer.ts
@@ -52,10 +52,10 @@ This is DESIGN ONLY. The planner agent handles detailed implementation plans.
     background_task(agent="pattern-finder", prompt="Find patterns for [similar functionality]", description="Find patterns")
   </fire-example>
   <poll>
-    background_list()  // repeat until all show "completed"
+    background_list()  // repeat until all show "completed" or "error"
   </poll>
   <collect>
-    background_output(task_id=...) for each completed task
+    background_output(task_id=...) for each completed task (skip errored tasks)
   </collect>
   <focus>purpose, constraints, success criteria</focus>
 </phase>
diff --git a/src/agents/planner.ts b/src/agents/planner.ts
index 3c767d0..74180ae 100644
--- a/src/agents/planner.ts
+++ b/src/agents/planner.ts
@@ -87,8 +87,8 @@ All research must serve the design - never second-guess design decisions.
     - btca_ask for library internals when needed
   </fire-phase>
   <collect-phase description="Poll until all complete, then collect">
-    - Poll with background_list until all tasks show completed
-    - Call background_output(task_id=...) for each completed task
+    - Poll with background_list until all tasks show completed or error
+    - Call background_output(task_id=...) for each completed task (skip errored)
     - Combine all results for planning phase
   </collect-phase>
   <rule>Only research what's needed to implement the design</rule>
diff --git a/src/agents/project-initializer.ts b/src/agents/project-initializer.ts
index 8e475a5..a720b9b 100644
--- a/src/agents/project-initializer.ts
+++ b/src/agents/project-initializer.ts
@@ -60,8 +60,8 @@ const PROMPT = `
 
     <phase name="2-collect" description="Poll and collect all results">
       <description>Poll background_list until all tasks complete, then collect with background_output</description>
-      <action>Poll background_list until all tasks show "completed"</action>
-      <action>Call background_output for each completed task</action>
+      <action>Poll background_list until all tasks show "completed" or "error"</action>
+      <action>Call background_output for each completed task (skip errored)</action>
       <action>Process tool results from phase 1</action>
     </phase>
 
@@ -229,8 +229,8 @@ const PROMPT = `
 
     <step description="COLLECT: Poll and gather all results">
       First poll until all tasks complete:
-      - background_list()  // repeat until all show "completed"
-      Then collect ALL results:
+      - background_list()  // repeat until all show "completed" or "error"
+      Then collect results (skip errored tasks):
       - background_output(task_id=task_id_1)
       - background_output(task_id=task_id_2)
       - background_output(task_id=task_id_3)